Bug fixed in ReplaceMissingValues

d8b4f0d1 · panos · Jérome Perrin · 904f5823 · 904f5823 · 904f5823
Commit d8b4f0d1 authored Jun 12, 2014 by panos Committed by Jérome Perrin Jun 17, 2014
5 changed files
--- a/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/CMSD_Topology10.xml
+++ b/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/CMSD_Topology10.xml
-<?xml version='1.0' encoding='utf8'?>
-<CMSDDocument>
-
-	<DataSection>
-		<PartType>
-			<Identifier>Part1</Identifier>
-		</PartType>
-		<PartType>
-			<Identifier>UnfinishedPart1</Identifier>
-		</PartType>
-	     <Resource>
-			<Identifier>S1</Identifier>
-			<Description>The source of the topology</Description>
-			<ResourceType>Source</ResourceType>
-			<Name>RawMaterial</Name>
-		 </Resource>
-		<Resource>
-			<Identifier>M1</Identifier>
-			<Description>The lathe of the topology</Description>
-			<ResourceType>Machine</ResourceType>
-			<Name>Machine1</Name>
-		 </Resource>
-		<Resource>
-			<Identifier>M2</Identifier>
-			<Description>The moulding machine of the topology</Description>
-			<ResourceType>Machine</ResourceType>
-			<Name>Machine2</Name>
-		 </Resource>
-		<Resource>
-			<Identifier>Queue</Identifier>
-			<Description>The queue of the topology</Description>
-			<ResourceType>Queue</ResourceType>
-			<Name>Queue</Name>
-		 </Resource>
-		<Resource>
-			<Identifier>Exit</Identifier>
-			<Description>The exit of the topology</Description>
-			<ResourceType>Exit</ResourceType>
-			<Name>Stock</Name>
-		 </Resource>		 
-		
-		<Resource>
-			<Identifier>A</Identifier>
-			<ResourceType>employee</ResourceType>
-		</Resource>
-		<Resource>
-			<Identifier>B</Identifier>
-			<ResourceType>employee</ResourceType>
-		</Resource>
-		<Resource>
-			<Identifier>Repairman</Identifier>
-			<Description>This element describes a class of employees</Description>
-			<ResourceType>employee</ResourceType>
-			<Name>W1</Name>
-		</Resource>
-********************************Process Plan*****************************************************		
-		<ProcessPlan>
-			<Identifier>ProcessPlan:Part1</Identifier>
-			<PartsProduced>
-				<Description>The part produced the process</Description>
-				<PartType>
-					<PartTypeIdentifier>Part1</PartTypeIdentifier>
-				</PartType>
-				<PartQuantity>1</PartQuantity>
-			</PartsProduced>
-			<PartsConsumed>
-				<Description>The part(s) consumed the process</Description>
-				<PartType>
-					<PartTypeIdentifier>UnfinishedPart1</PartTypeIdentifier>
-				</PartType>
-				<PartQuantity>1</PartQuantity>
-			</PartsConsumed>
-			<FirstProcess>
-				<ProcessIdentifier>MainProcessSequence</ProcessIdentifier>
-			</FirstProcess>
-			<Process>
-				<Identifier>MainProcessSequence</Identifier>
-				<RepetitionCount>1</RepetitionCount>
-				<SubProcessGroup>
-					<Type>sequence</Type>
-					<Process>
-						<ProcessIdentifier>A010</ProcessIdentifier>
-					</Process>
-					<Process>
-						<ProcessIdentifier>A020</ProcessIdentifier>
-					</Process>
-					<Process>
-						<ProcessIdentifier>A030</ProcessIdentifier>
-					</Process>
-					<Process>
-						<ProcessIdentifier>A040</ProcessIdentifier>
-					</Process>
-					<Process>
-						<ProcessIdentifier>A050</ProcessIdentifier>
-					</Process>
-				</SubProcessGroup>
-			</Process>
-***********************************************Process************************************************			
-			<Process>
-				<Identifier>A010</Identifier>
-				<Description>Process 1</Description>
-				<ResourcesRequired>
-					<Description>Source</Description>
-					<Resource>
-						<ResourceIdentifier>S1</ResourceIdentifier>
-					</Resource>
-				</ResourcesRequired>
-				<Property>
-					<Name>interarrivalTime</Name>
-					<Unit>minutes</Unit>
-					<Distribution>
-						<Name>Fixed</Name>
-						<DistributionParameter>
-						    <Name>mean</Name>
-							<Value>0.5</Value>
-						</DistributionParameter>
-					</Distribution>
-				</Property>
-				<Property>
-					<Name>partType</Name>
-					<Value>Part</Value>
-				</Property>
-			</Process>
-	
-			<Process>
-				<Identifier>A020</Identifier>
-				<Description>Process 2</Description>
-				<PartsProduced>
-					<Description>...</Description>
-					<PartType>
-						<PartTypeIdentifier>UnfinishedPart1</PartTypeIdentifier>
-					</PartType>
-					<PartQuantity>1</PartQuantity>
-				</PartsProduced>
-				<PartsConsumed>
-					<Description>...</Description>
-					<PartType>
-						<PartTypeIdentifier>UnfinishedPart1</PartTypeIdentifier>
-					</PartType>
-					<PartQuantity>1</PartQuantity>
-				</PartsConsumed>
-				<ResourcesRequired>
-					<Description>The employee performing the operation.</Description>
-					<Resource>
-						<ResourceIdentifier>A</ResourceIdentifier>
-					</Resource>
-				</ResourcesRequired>
-				<ResourcesRequired>
-					<Description>Machine1.</Description>
-					<Resource>
-						<ResourceIdentifier>M1</ResourceIdentifier>
-					</Resource>
-				</ResourcesRequired>
-				<OperationTime>
-					<Unit>minutes</Unit>
-					<Distribution>
-					<Name></Name>
-						<DistributionParameterA>
-							<Name></Name>
-							<Value></Value>
-						</DistributionParameterA>
-						<DistributionParameterB>
-							<Name></Name>
-							<Value></Value>
-						</DistributionParameterB>
-					</Distribution>
-				</OperationTime>
-				<Property>
-					<Name>MeanTimeToFailure</Name>
-					<Unit>minutes</Unit>
-					<Distribution>
-						<Name>Fixed</Name>
-						<DistributionParameter>
-							<Name>mean</Name>
-							<Value>60</Value>
-						</DistributionParameter>
-					</Distribution>
-				</Property>
-				<Property>
-					<Name>MeanTimeToRepair</Name>
-					<Unit>minutes</Unit>
-					<Distribution>
-						<Name>Fixed</Name>
-						<DistributionParameter>
-							<Name>mean</Name>
-							<Value>5</Value>
-						</DistributionParameter>
-					</Distribution>
-					<Property>
-						<Name>RepairmanRequired</Name>
-						<ResourcesRequired>
-							<Description>The employee performing the operation.</Description>
-							<ResourceIdentifier>W1</ResourceIdentifier>
-						</ResourcesRequired>
-					</Property>
-				</Property>
-			</Process>
-			
-			<Process>
-				<Identifier>A030</Identifier>
-				<Description>Process 3</Description>
-				<ResourcesRequired>
-					<Description>Queue1.</Description>
-					<Resource>
-						<ResourceIdentifier>Q1</ResourceIdentifier>
-					</Resource>
-				</ResourcesRequired>
-				<Property>
-					<Name>capacity</Name>
-					<Value>1</Value>
-				</Property>
-			</Process>	
-				
-			<Process>
-				<Identifier>A040</Identifier>
-				<Description>Process 4</Description>
-				<PartsProduced>
-					<Description>...</Description>
-					<PartType>
-						<PartTypeIdentifier>UnfinishedPart1</PartTypeIdentifier>
-					</PartType>
-					<PartQuantity>1</PartQuantity>
-				</PartsProduced>
-				<PartsConsumed>
-					<Description>...</Description>
-					<PartType>
-						<PartTypeIdentifier>UnfinishedPart1</PartTypeIdentifier>
-					</PartType>
-					<PartQuantity>1</PartQuantity>
-				</PartsConsumed>
-				<ResourcesRequired>
-					<Description>The employee performing the operation.</Description>
-					<Resource>
-						<ResourceIdentifier>B</ResourceIdentifier>
-					</Resource>
-				</ResourcesRequired>
-				<ResourcesRequired>
-					<Description>Machine2.</Description>
-					<Resource>
-						<ResourceIdentifier>M2</ResourceIdentifier>
-					</Resource>
-				</ResourcesRequired>
-				<OperationTime>
-					<Unit>minutes</Unit>
-					<Distribution>
-					<Name></Name>
-						<DistributionParameterA>
-							<Name></Name>
-							<Value></Value>
-						</DistributionParameterA>
-						<DistributionParameterB>
-							<Name></Name>
-							<Value></Value>
-						</DistributionParameterB>
-					</Distribution>
-				</OperationTime>
-				<Property>
-					<Name>MeanTimeToFailure</Name>
-					<Unit>minutes</Unit>
-					<Distribution>
-						<Name>Fixed</Name>
-						<DistributionParameter>
-							<Name>mean</Name>
-							<Value>40</Value>
-						</DistributionParameter>
-					</Distribution>
-				</Property>
-				<Property>
-					<Name>MeanTimeToRepair</Name>
-					<Unit>minutes</Unit>
-					<Distribution>
-						<Name>Fixed</Name>
-						<DistributionParameter>
-							<Name>mean</Name>
-							<Value>10</Value>
-						</DistributionParameter>
-					</Distribution>
-					<Property>
-						<Name>RepairmanRequired</Name>
-						<ResourcesRequired>
-							<Description>The employee performing the operation.</Description>
-							<ResourceIdentifier>W1</ResourceIdentifier>
-						</ResourcesRequired>
-					</Property>
-				</Property>
-			</Process>
-		
-			<Process>
-				<Identifier>A050</Identifier>
-				<Description>Process 5</Description>
-				<ResourcesRequired>
-					<Description>Exit.</Description>
-					<Resource>
-						<ResourceIdentifier>E1</ResourceIdentifier>
-					</Resource>
-				</ResourcesRequired>
-			</Process>
-		</ProcessPlan>
-	</DataSection>
-</CMSDDocument>
\ No newline at end of file
--- a/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/JSON_Topology10.json
+++ b/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/JSON_Topology10.json
-{
- "modelResource": [
-  {
-   "_class": "Dream.Repairman", 
-   "capacity": "1", 
-   "id": "W1", 
-   "name": "W1"
-  }
- ], 
- "_class": "Dream.Simulation", 
- "coreObject": [
-  {
-   "name": "Raw Material", 
-   "entity": "Part", 
-   "interarrivalTime": {
-    "distributionType": "Fixed", 
-    "mean": "0.5"
-   }, 
-   "successorList": [
-    "DummyQ"
-   ], 
-   "_class": "Dream.Source", 
-   "id": "S1"
-  }, 
-  {
-   "predecessorList": [
-    "DummyQ"
-   ], 
-   "name": "Machine1", 
-   "processingTime": {
-
-   }, 
-   "successorList": [
-    "Q1"
-   ], 
-   "failures": {
-    "MTTR": "5", 
-    "failureDistribution": "Fixed", 
-    "repairman": "W1", 
-    "MTTF": "60"
-   }, 
-   "_class": "Dream.Machine", 
-   "id": "M1"
-  }, 
-  {
-   "predecessorList": [
-    "Q1"
-   ], 
-   "name": "Machine2", 
-   "processingTime": {
-    
-   }, 
-   "successorList": [
-    "E1"
-   ], 
-   "failures": {
-    "MTTR": "10", 
-    "failureDistribution": "Fixed", 
-    "repairman": "W1", 
-    "MTTF": "40"
-   }, 
-   "_class": "Dream.Machine", 
-   "id": "M2"
-  }, 
-  {
-   "capacity": "1", 
-   "name": "DummyQ", 
-   "isDummy": "True", 
-   "predecessorList": [
-    "S1"
-   ], 
-   "successorList": [
-    "M1"
-   ], 
-   "_class": "Dream.Queue", 
-   "id": "DummyQ"
-  }, 
-  {
-   "capacity": "1", 
-   "name": "Q1", 
-   "isDummy": "False", 
-   "predecessorList": [
-    "M1"
-   ], 
-   "successorList": [
-    "M2"
-   ], 
-   "_class": "Dream.Queue", 
-   "id": "Q1"
-  }, 
-  {
-   "predecessorList": [
-    "M2"
-   ], 
-   "_class": "Dream.Exit", 
-   "id": "E1", 
-   "name": "Stock"
-  }
- ], 
- "general": {
-  "trace": "Yes", 
-  "_class": "Dream.Configuration", 
-  "numberOfReplications": "1", 
-  "maxSimTime": "1440", 
-  "confidenceLevel": "0.95"
- }
-}
\ No newline at end of file
--- a/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/KnowledgeExtractionTool_example.py
+++ b/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/KnowledgeExtractionTool_example.py
-'''
-Created on 19 Feb 2014
-
-@author: Panos
-'''
-# ===========================================================================
-# Copyright 2013 University of Limerick
-#
-# This file is part of DREAM.
-#
-# DREAM is free software: you can redistribute it and/or modify
-# it under the terms of the GNU Lesser General Public License as published by
-# the Free Software Foundation, either version 3 of the License, or
-# (at your option) any later version.
-#
-# DREAM is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-# GNU Lesser General Public License for more details.
-#
-# You should have received a copy of the GNU Lesser General Public License
-# along with DREAM.  If not, see <http://www.gnu.org/licenses/>.
-# ===========================================================================
-
-from ImportExceldata import Import_Excel
-from DistributionFitting import DistFittest
-from xml.etree import ElementTree as et
-from ExcelOutput import Output
-from ReplaceMissingValues import HandleMissingValues
-import xlrd
-import json
-
-#================================================ This script is a simple example of the Knowledge extraction tool ===============================================================#
-
-#The following is the Main script, that calls two Python objects in order to conduct the three main components of the Knowledge extraction tool
-#In the following example the operation times of the topology's two machines are given in an Excel document. 
-#Import_Excel object imports data from the Excel document to the tool and DistFittest object fits the data to a statistical distribution using Kolmogorov-Smirnov test
-   
-workbook = xlrd.open_workbook('inputsKEtool.xls')      #Using xlrd library opens the Excel document with the input data 
-worksheets = workbook.sheet_names()
-worksheet_OperationTime = worksheets[0]             #It creates a variable that holds the first Excel worksheet 
- 
-X=Import_Excel()                                    #Call the import_Excel object
-OperationTimes= X.Input_data(worksheet_OperationTime,workbook)      #It defines a Python dictionary, giving as name OpearationTimes and as value the returned dictionary from the import_Excel object 
-Machine1_OpearationTimes = OperationTimes.get('Machine1',[])        #Two lists are defined (Machine1_OpearationTimes, Machine2_OpearationTimes) with the operation times data of each machine
-Machine2_OpearationTimes = OperationTimes.get('Machine2',[])
-
-A=HandleMissingValues()                                     #Call the HandleMissingValues object
-Machine1_OpearationTimes= A.DeleteMissingValue(Machine1_OpearationTimes)        #It deletes the missing values in the lists with the operation times data
-Machine2_OpearationTimes= A.DeleteMissingValue(Machine2_OpearationTimes)
-
-Dict={}
-B=DistFittest()                                     #It calls the DistFittest object
-Dict['M1']=B.ks_test(Machine1_OpearationTimes)                 #It conducts the Kolmogorov-Smirnov test in the list with the operation times data 
-Dict['M2']=B.ks_test(Machine2_OpearationTimes)
-M1=Dict.get('M1')
-M2=Dict.get('M2')
-
-
-#==================================== Output preparation: output the updated values in the CMSD information model of Topology10 ====================================================#
-
-datafile=('CMSD_Topology10.xml')       #It defines the name or the directory of the XML file that is manually written the CMSD information model
-tree = et.parse(datafile)                                               #This file will be parsed using the XML.ETREE Python library
-
-M1Parameters=[]
-M1ParameterValue=[]
-for index in list(Dict['M1'].keys()):
-    if index is not 'distributionType':
-        M1Parameters.append(index)
-        M1ParameterValue.append(Dict['M1'][index])
-if Dict['M1']['distributionType']=='Normal':
-    del M1['min']
-    del M1['max']
-elif Dict['M2']['distributionType']=='Normal':
-    del M2['min']
-    del M2['max']
-
-M2Parameters=[]
-M2ParameterValue=[]
-for index in list(Dict['M2'].keys()):
-    if index is not 'distributionType':
-        M2Parameters.append(index)
-        M2ParameterValue.append(Dict['M2'][index])       
-
-root=tree.getroot()
-process=tree.findall('./DataSection/ProcessPlan/Process')               #It creates a new variable and using the 'findall' order in XML.ETREE library, this new variable holds all the processes defined in the XML file
-for process in process:
-    process_identifier=process.find('Identifier').text                  #It creates a new variable that holds the text of the Identifier element in the XML file
-    if process_identifier=='A020':                                      #It checks using if...elif syntax if the process identifier is 'A020', so the process that uses the first machine
-        OperationTime=process.get('OpeationTime')                       #It gets the element attribute OpearationTime inside the Process node
-        Distribution=process.get('./OperationTime/Distribution')        #It gets the element attribute Distribution inside the OpearationTime node
-        Name=process.find('./OperationTime/Distribution/Name')          #It finds the subelement Name inside the Distribution attribute
-        Name.text=Dict['M1']['distributionType']                                     #It changes the text between the Name element tags, putting the name of the distribution (e.g. in Normal distribution that will be Normal) 
-        DistributionParameterA=process.get('./OperationTime/Distribution/DistributionParameterA')
-        Name=process.find('./OperationTime/Distribution/DistributionParameterA/Name')
-        Name.text=str(M1Parameters[0])                               #It changes the text between the Name element tags, putting the name of the distribution's first parameter (e.g. in Normal that will be the mean)
-        Value=process.find('./OperationTime/Distribution/DistributionParameterA/Value')
-        Value.text=str(M1ParameterValue[0])                          #It changes the text between the Value element tags, putting the value of the distribution's first parameter (e.g. in Normal so for mean value that will be 5.0)
-        DistributionParameterB=process.get('./OperationTime/Distribution/DistributionParameterB')
-        Name=process.find('./OperationTime/Distribution/DistributionParameterB/Name')
-        Name.text=str(M1Parameters[1])                                #It changes the text between the Name element tags, putting the name of the distribution's second parameter (e.g. in Normal that will be the standarddeviation)
-        Value=process.find('./OperationTime/Distribution/DistributionParameterB/Value')
-        Value.text=str(M1ParameterValue[1])                           #It changes the text between the Value element tags, putting the value of the distribution's second parameter (e.g. in Normal so for standarddeviation value that will be 1.3)
-    elif process_identifier=='A040':                                #It checks using if...elif syntax if the process identifier is 'A040', so the process that uses the second machine 
-        OperationTime=process.get('OpeationTime')
-        Distribution=process.get('./OperationTime/Distribution')
-        Name=process.find('./OperationTime/Distribution/Name')
-        Name.text=Dict['M2']['distributionType'] 
-        DistributionParameterA=process.get('./OperationTime/Distribution/DistributionParameterA')
-        Name=process.find('./OperationTime/Distribution/DistributionParameterA/Name')
-        Name.text=str(M2Parameters[0]) 
-        Value=process.find('./OperationTime/Distribution/DistributionParameterA/Value')
-        Value.text=str(M2ParameterValue[0]) 
-        DistributionParameterB=process.get('./OperationTime/Distribution/DistributionParameterB')
-        Name=process.find('./OperationTime/Distribution/DistributionParameterB/Name')
-        Name.text=str(M2Parameters[1]) 
-        Value=process.find('./OperationTime/Distribution/DistributionParameterB/Value')
-        Value.text=str(M2ParameterValue[1]) 
-    else:
-        continue
-    tree.write('CMSD_Topology10_Output.xml',encoding="utf8")                         #It writes the element tree to a specified file, using the 'utf8' output encoding
-
-#================================= Output preparation: output the updated values in the JSON file of Topology10 =========================================================#
-jsonFile= open('JSON_Topology10.json','r')      #It opens the Topology10 JSON file 
-data = json.load(jsonFile)                                                              #It loads the file
-jsonFile.close()
-nodes=data.get('coreObject',[])                                                         #It creates a variable that holds the 'coreObject' list
-
-for element in nodes:
-    name=element.get('name')                                                            #It creates a variable that gets the element attribute 'name'
-    processingTime=element.get('processingTime',{})                                     #It creates a variable that gets the element attribute 'processingTime'
-        
-    if name =='Machine1':
-        element['processingTime']=Dict['M1']                            #It checks using if...elif syntax if the name is 'Machine1', so the first machine in the Topology10
-    elif name=='Machine2':                        
-        element['processingTime']=Dict['M2']
-    else:
-        continue                            
-        
-    jsonFile = open('JSON_Topology10_Output.json',"w")     #It opens the JSON file
-    jsonFile.write(json.dumps(data, indent=True))                                           #It writes the updated data to the JSON file 
-    jsonFile.close()                                                                        #It closes the file
-        
-#================================ Calling the ExcelOutput object, outputs the outcomes of the statistical analysis in Excel files =============================================#
-C=Output()
-C.PrintDistributionFit(Machine1_OpearationTimes,'Machine1_DistFitResults.xls')   
-C.PrintStatisticalMeasures(Machine1_OpearationTimes,'Machine1_StatResults.xls')
-C.PrintDistributionFit(Machine2_OpearationTimes,'Machine2_DistFitResults.xls')   
-C.PrintStatisticalMeasures(Machine2_OpearationTimes,'Machine2_StatResults.xls')
-
-    
\ No newline at end of file
--- a/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/inputsKEtool.xls
+++ b/dream/KnowledgeExtraction/KnowledgeExtractionTool_example/inputsKEtool.xls
--- a/dream/KnowledgeExtraction/ReplaceMissingValues.py
+++ b/dream/KnowledgeExtraction/ReplaceMissingValues.py
@@ -47,7 +47,6 @@ class HandleMissingValues(BasicStatisticalMeasures):
    def ReplaceWithMean(self,mylist):          #Replace in the given list the missing values with the mean value  
        list1=self.DeleteMissingValue(mylist)  #Create a new list, which is the given list deleting the missing values (calling the DeleteMissingValue method)
        mean=sum(list1)/float(len(list1))      #Calculate the mean value of the new list
-        print mean
        i=0
        for value in mylist:
            if value is '' :