Writing Unit for Madrigal decorated (Python 2.x only)
George Yong
r1206:59caf7a2130e

The requested changes are too big and content was truncated.

@@ -1,642 +1,645 @@
1 1 '''
2 2 Created on Aug 1, 2017
3 3
4 4 @author: Juan C. Espinoza
5 5 '''
6 6
7 7 import os
8 8 import sys
9 9 import time
10 10 import json
11 11 import glob
12 12 import datetime
13 13
14 14 import numpy
15 15 import h5py
16
17 from schainpy.model.io.jroIO_base import JRODataReader
16 from schainpy.model.io.jroIO_base import LOCALTIME, JRODataReader, JRODataWriter
18 17 from schainpy.model.proc.jroproc_base import ProcessingUnit, Operation, MPDecorator
19 18 from schainpy.model.data.jrodata import Parameters
20 19 from schainpy.utils import log
21 20
22 21 try:
23 22 import madrigal.cedar
24 23 except:
25 24 log.warning(
26 25 'You should install "madrigal library" module if you want to read/write Madrigal data'
27 26 )
28 27
29 28 DEF_CATALOG = {
30 29 'principleInvestigator': 'Marco Milla',
31 'expPurpose': None,
32 'cycleTime': None,
33 'correlativeExp': None,
34 'sciRemarks': None,
35 'instRemarks': None
30 'expPurpose': '',
31 'cycleTime': '',
32 'correlativeExp': '',
33 'sciRemarks': '',
34 'instRemarks': ''
36 35 }
36
37 37 DEF_HEADER = {
38 'kindatDesc': None,
38 'kindatDesc': '',
39 39 'analyst': 'Jicamarca User',
40 'comments': None,
41 'history': None
40 'comments': '',
41 'history': ''
42 42 }
43
43 44 MNEMONICS = {
44 45 10: 'jro',
45 46 11: 'jbr',
46 47 840: 'jul',
47 48 13: 'jas',
48 49 1000: 'pbr',
49 50 1001: 'hbr',
50 51 1002: 'obr',
52 400: 'clr'
53
51 54 }
52 55
53 56 UT1970 = datetime.datetime(1970, 1, 1) - datetime.timedelta(seconds=time.timezone)
54 57
55 58 def load_json(obj):
56 59 '''
57 60 Parse JSON, coercing unicode values to str
58 61 '''
59 62
60 63 if isinstance(obj, str):
61 64 iterable = json.loads(obj)
62 65 else:
63 66 iterable = obj
64 67
65 68 if isinstance(iterable, dict):
66 return {str(k): load_json(v) if isinstance(v, dict) else str(v) if isinstance(v, str) else v
69 return {str(k): load_json(v) if isinstance(v, dict) else str(v) if isinstance(v, (str,unicode)) else v
67 70 for k, v in list(iterable.items())}
68 71 elif isinstance(iterable, (list, tuple)):
69 72 return [str(v) if isinstance(v, str) else v for v in iterable]
70 73
71 74 return iterable
72 75
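
A quick sketch of load_json in use (illustrative, not part of the diff): nested dicts are converted recursively and, on Python 2.x where json.loads returns unicode, string keys and values are coerced to str, while other values pass through unchanged. The JSON string below is made up:

cfg = load_json('{"GDALT": "heightList", "meta": {"kinst": 10}}')
# cfg == {'GDALT': 'heightList', 'meta': {'kinst': 10}}
# keys and string values are plain str; the int is left as-is
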
73 76 @MPDecorator
74 77 class MADReader(JRODataReader, ProcessingUnit):
75 78
76 79 def __init__(self):
77 80
78 81 ProcessingUnit.__init__(self)
79 82
80 83 self.dataOut = Parameters()
81 84 self.counter_records = 0
82 85 self.nrecords = None
83 86 self.flagNoMoreFiles = 0
84 87 self.isConfig = False
85 88 self.filename = None
86 89 self.intervals = set()
87 90
88 91 def setup(self,
89 92 path=None,
90 93 startDate=None,
91 94 endDate=None,
92 95 format=None,
93 96 startTime=datetime.time(0, 0, 0),
94 97 endTime=datetime.time(23, 59, 59),
95 98 **kwargs):
96 99
97 100 self.path = path
98 101 self.startDate = startDate
99 102 self.endDate = endDate
100 103 self.startTime = startTime
101 104 self.endTime = endTime
102 105 self.datatime = datetime.datetime(1900,1,1)
103 106 self.oneDDict = load_json(kwargs.get('oneDDict',
104 107 "{\"GDLATR\":\"lat\", \"GDLONR\":\"lon\"}"))
105 108 self.twoDDict = load_json(kwargs.get('twoDDict',
106 109 "{\"GDALT\": \"heightList\"}"))
107 110 self.ind2DList = load_json(kwargs.get('ind2DList',
108 111 "[\"GDALT\"]"))
109 112 if self.path is None:
110 113 raise ValueError('The path is not valid')
111 114
112 115 if format is None:
113 116 raise ValueError('The format is not valid, choose simple or hdf5')
114 117 elif format.lower() in ('simple', 'txt'):
115 118 self.ext = '.txt'
116 119 elif format.lower() in ('cedar',):
117 120 self.ext = '.001'
118 121 else:
119 122 self.ext = '.hdf5'
120 123
121 124 self.search_files(self.path)
122 125 self.fileId = 0
123 126
124 127 if not self.fileList:
125 128 raise Warning('There are no files matching these dates in the folder: {}. \n Check startDate and endDate'.format(path))
126 129
127 130 self.setNextFile()
128 131
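
A hedged sketch of configuring MADReader directly, mirroring the setup() signature above; the path is hypothetical and the JSON kwargs repeat the defaults shown. Note that with @MPDecorator applied, the class is normally instantiated and driven by the controller rather than by hand:

import datetime

reader = MADReader()
reader.setup(
    path='/data/madrigal',                      # hypothetical input folder
    startDate=datetime.date(2017, 8, 1),
    endDate=datetime.date(2017, 8, 2),
    format='hdf5',                              # or 'simple'/'txt'/'cedar'
    oneDDict='{"GDLATR": "lat", "GDLONR": "lon"}',
    twoDDict='{"GDALT": "heightList"}',
    ind2DList='["GDALT"]')                      # scans the folder, opens the first file
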
129 132 def search_files(self, path):
130 133 '''
131 134 Searching for madrigal files in path
132 135 Creating a list of files to process included in [startDate, endDate]
133 136
134 137 Input:
135 138 path - Path to find files
136 139 '''
137 140
138 141 log.log('Searching files {} in {} '.format(self.ext, path), 'MADReader')
139 142 foldercounter = 0
140 143 fileList0 = glob.glob1(path, '*{}'.format(self.ext))
141 144 fileList0.sort()
142 145
143 146 self.fileList = []
144 147 self.dateFileList = []
145 148
146 149 startDate = self.startDate - datetime.timedelta(1)
147 150 endDate = self.endDate + datetime.timedelta(1)
148 151
149 152 for thisFile in fileList0:
150 153 year = thisFile[3:7]
151 154 if not year.isdigit():
152 155 continue
153 156
154 157 month = thisFile[7:9]
155 158 if not month.isdigit():
156 159 continue
157 160
158 161 day = thisFile[9:11]
159 162 if not day.isdigit():
160 163 continue
161 164
162 165 year, month, day = int(year), int(month), int(day)
163 166 dateFile = datetime.date(year, month, day)
164 167
165 168 if (startDate > dateFile) or (endDate < dateFile):
166 169 continue
167 170
168 171 self.fileList.append(thisFile)
169 172 self.dateFileList.append(dateFile)
170 173
171 174 return
172 175
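
The date is read from fixed positions in the file name, a 3-character station mnemonic followed by YYYYMMDD; a sketch with a hypothetical name:

name = 'jul20170801.hdf5'                       # hypothetical Madrigal file
year, month, day = int(name[3:7]), int(name[7:9]), int(name[9:11])
# -> (2017, 8, 1), compared against [startDate - 1 day, endDate + 1 day]
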
173 176 def parseHeader(self):
174 177 '''
175 178 '''
176 179
177 180 self.output = {}
178 181 self.version = '2'
179 182 s_parameters = None
180 183 if self.ext == '.txt':
181 184 self.parameters = [s.strip().lower() for s in self.fp.readline().strip().split(' ') if s]
182 185 elif self.ext == '.hdf5':
183 186 metadata = self.fp['Metadata']
184 187 data = self.fp['Data']['Array Layout']
185 188 if 'Independent Spatial Parameters' in metadata:
186 189 s_parameters = [s[0].lower() for s in metadata['Independent Spatial Parameters']]
187 190 self.version = '3'
188 191 one = [s[0].lower() for s in data['1D Parameters']['Data Parameters']]
189 192 one_d = [1 for s in one]
190 193 two = [s[0].lower() for s in data['2D Parameters']['Data Parameters']]
191 194 two_d = [2 for s in two]
192 195 self.parameters = one + two
193 196 self.parameters_d = one_d + two_d
194 197
195 log.success('Parameters found: {}'.format(','.join(str(self.parameters))),
198 log.success('Parameters found: {}'.format(self.parameters),
196 199 'MADReader')
197 200 if s_parameters:
198 201 log.success('Spatial parameters: {}'.format(','.join(str(s_parameters))),
199 202 'MADReader')
200 203
201 204 for param in list(self.oneDDict.keys()):
202 205 if param.lower() not in self.parameters:
203 206 log.warning(
204 207 'Parameter {} not found, it will be ignored'.format(
205 208 param),
206 209 'MADReader')
207 210 self.oneDDict.pop(param, None)
208 211
209 212 for param, value in list(self.twoDDict.items()):
210 213 if param.lower() not in self.parameters:
211 214 log.warning(
212 215 'Parameter {} not found, it will be ignored'.format(
213 216 param),
214 217 'MADReader')
215 218 self.twoDDict.pop(param, None)
216 219 continue
217 220 if isinstance(value, list):
218 221 if value[0] not in self.output:
219 222 self.output[value[0]] = []
220 223 self.output[value[0]].append(None)
221 224
222 225 def parseData(self):
223 226 '''
224 227 '''
225 228
226 229 if self.ext == '.txt':
227 230 self.data = numpy.genfromtxt(self.fp, missing_values=('missing'))
228 231 self.nrecords = self.data.shape[0]
229 232 self.ranges = numpy.unique(self.data[:,self.parameters.index(self.ind2DList[0].lower())])
230 233 elif self.ext == '.hdf5':
231 234 self.data = self.fp['Data']['Array Layout']
232 235 self.nrecords = len(self.data['timestamps'].value)
233 236 self.ranges = self.data['range'].value
234 237
235 238 def setNextFile(self):
236 239 '''
237 240 '''
238 241
239 242 file_id = self.fileId
240 243
241 244 if file_id == len(self.fileList):
242 245 log.success('No more files', 'MADReader')
243 246 self.flagNoMoreFiles = 1
244 247 return 0
245 248
246 249 log.success(
247 250 'Opening: {}'.format(self.fileList[file_id]),
248 251 'MADReader'
249 252 )
250 253
251 254 filename = os.path.join(self.path, self.fileList[file_id])
252 255
253 256 if self.filename is not None:
254 257 self.fp.close()
255 258
256 259 self.filename = filename
257 260 self.filedate = self.dateFileList[file_id]
258 261
259 262 if self.ext=='.hdf5':
260 263 self.fp = h5py.File(self.filename, 'r')
261 264 else:
262 265 self.fp = open(self.filename, 'rb')
263 266
264 267 self.parseHeader()
265 268 self.parseData()
266 269 self.sizeOfFile = os.path.getsize(self.filename)
267 270 self.counter_records = 0
268 271 self.flagIsNewFile = 0
269 272 self.fileId += 1
270 273
271 274 return 1
272 275
273 276 def readNextBlock(self):
274 277
275 278 while True:
276 279 self.flagDiscontinuousBlock = 0
277 280 if self.flagIsNewFile:
278 281 if not self.setNextFile():
279 282 return 0
280 283
281 284 self.readBlock()
282 285
283 286 if (self.datatime < datetime.datetime.combine(self.startDate, self.startTime)) or \
284 287 (self.datatime > datetime.datetime.combine(self.endDate, self.endTime)):
285 288 log.warning(
286 289 'Reading Record No. {}/{} -> {} [Skipping]'.format(
287 290 self.counter_records,
288 291 self.nrecords,
289 292 self.datatime.ctime()),
290 293 'MADReader')
291 294 continue
292 295 break
293 296
294 297 log.log(
295 298 'Reading Record No. {}/{} -> {}'.format(
296 299 self.counter_records,
297 300 self.nrecords,
298 301 self.datatime.ctime()),
299 302 'MADReader')
300 303
301 304 return 1
302 305
303 306 def readBlock(self):
304 307 '''
305 308 '''
306 309 dum = []
307 310 if self.ext == '.txt':
308 311 dt = self.data[self.counter_records][:6].astype(int)
309 312 if datetime.datetime(dt[0], dt[1], dt[2], dt[3], dt[4], dt[5]).date() > self.datatime.date():
310 313 self.flagDiscontinuousBlock = 1
311 314 self.datatime = datetime.datetime(dt[0], dt[1], dt[2], dt[3], dt[4], dt[5])
312 315 while True:
313 316 dt = self.data[self.counter_records][:6].astype(int)
314 317 datatime = datetime.datetime(dt[0], dt[1], dt[2], dt[3], dt[4], dt[5])
315 318 if datatime == self.datatime:
316 319 dum.append(self.data[self.counter_records])
317 320 self.counter_records += 1
318 321 if self.counter_records == self.nrecords:
319 322 self.flagIsNewFile = True
320 323 break
321 324 continue
322 325 self.intervals.add((datatime-self.datatime).seconds)
323 326 break
324 327 elif self.ext == '.hdf5':
325 328 datatime = datetime.datetime.utcfromtimestamp(
326 329 self.data['timestamps'][self.counter_records])
327 330 nHeights = len(self.ranges)
328 331 for n, param in enumerate(self.parameters):
329 332 if self.parameters_d[n] == 1:
330 333 dum.append(numpy.ones(nHeights)*self.data['1D Parameters'][param][self.counter_records])
331 334 else:
332 335 if self.version == '2':
333 336 dum.append(self.data['2D Parameters'][param][self.counter_records])
334 337 else:
335 338 tmp = self.data['2D Parameters'][param].value.T
336 339 dum.append(tmp[self.counter_records])
337 340 self.intervals.add((datatime-self.datatime).seconds)
338 341 if datatime.date()>self.datatime.date():
339 342 self.flagDiscontinuousBlock = 1
340 343 self.datatime = datatime
341 344 self.counter_records += 1
342 345 if self.counter_records == self.nrecords:
343 346 self.flagIsNewFile = True
344 347
345 348 self.buffer = numpy.array(dum)
346 349 return
347 350
348 351 def set_output(self):
349 352 '''
350 353 Storing data from buffer to dataOut object
351 354 '''
352 355
353 356 parameters = [None for __ in self.parameters]
354 357
355 358 for param, attr in list(self.oneDDict.items()):
356 359 x = self.parameters.index(param.lower())
357 360 setattr(self.dataOut, attr, self.buffer[0][x])
358 361
359 for param, value in list(self.twoDDict.items()):
362 for param, value in list(self.twoDDict.items()):
360 363 x = self.parameters.index(param.lower())
361 364 if self.ext == '.txt':
362 365 y = self.parameters.index(self.ind2DList[0].lower())
363 366 ranges = self.buffer[:,y]
364 if self.ranges.size == ranges.size:
365 continue
367 #if self.ranges.size == ranges.size:
368 # continue
366 369 index = numpy.where(numpy.in1d(self.ranges, ranges))[0]
367 370 dummy = numpy.zeros(self.ranges.shape) + numpy.nan
368 371 dummy[index] = self.buffer[:,x]
369 372 else:
370 373 dummy = self.buffer[x]
371
374
372 375 if isinstance(value, str):
373 376 if value not in self.ind2DList:
374 377 setattr(self.dataOut, value, dummy.reshape(1,-1))
375 378 elif isinstance(value, list):
376 379 self.output[value[0]][value[1]] = dummy
377 380 parameters[value[1]] = param
378 381
379 382 for key, value in list(self.output.items()):
380 383 setattr(self.dataOut, key, numpy.array(value))
381 384
382 385 self.dataOut.parameters = [s for s in parameters if s]
383 386 self.dataOut.heightList = self.ranges
384 387 self.dataOut.utctime = (self.datatime - datetime.datetime(1970, 1, 1)).total_seconds()
385 388 self.dataOut.utctimeInit = self.dataOut.utctime
386 389 self.dataOut.paramInterval = min(self.intervals)
387 390 self.dataOut.useLocalTime = False
388 391 self.dataOut.flagNoData = False
389 392 self.dataOut.nrecords = self.nrecords
390 393 self.dataOut.flagDiscontinuousBlock = self.flagDiscontinuousBlock
391 394
392 395 def getData(self):
393 396 '''
394 397 Storing data from the data buffer to the dataOut object
395 398 '''
396 399 if self.flagNoMoreFiles:
397 400 self.dataOut.flagNoData = True
398 401 self.dataOut.error = 'No file left to process'
399 402 return 0
400 403
401 404 if not self.readNextBlock():
402 405 self.dataOut.flagNoData = True
403 406 return 0
404 407
405 408 self.set_output()
406 409
407 410 return 1
408 411
409
412 @MPDecorator
410 413 class MADWriter(Operation):
411 414
412 415 missing = -32767
413 416
414 def __init__(self, **kwargs):
417 def __init__(self):
415 418
416 Operation.__init__(self, **kwargs)
419 Operation.__init__(self)
417 420 self.dataOut = Parameters()
418 421 self.counter = 0
419 422 self.path = None
420 423 self.fp = None
421 424
422 425 def run(self, dataOut, path, oneDDict, ind2DList='[]', twoDDict='{}',
423 426 metadata='{}', format='cedar', **kwargs):
424 427 '''
425 428 Inputs:
426 429 path - path where files will be created
427 430 oneDDict - json of one-dimensional parameters in record where keys
428 431 are Madrigal codes (integers or mnemonics) and values the corresponding
429 432 dataOut attribute e.g: {
430 433 'gdlatr': 'lat',
431 434 'gdlonr': 'lon',
432 435 'gdlat2':'lat',
433 436 'glon2':'lon'}
434 437 ind2DList - list of independent spatial two-dimensional parameters e.g:
435 438 ['heightList']
436 439 twoDDict - json of two-dimensional parameters in record where keys
437 440 are Madrigal codes (integers or mnemonics) and values the corresponding
438 441 dataOut attribute; if a multidimensional array, specify it as a tuple
439 442 ('attr', pos) e.g: {
440 443 'gdalt': 'heightList',
441 444 'vn1p2': ('data_output', 0),
442 445 'vn2p2': ('data_output', 1),
443 446 'vn3': ('data_output', 2),
444 447 'snl': ('data_SNR', 'db')
445 448 }
446 449 metadata - json of madrigal metadata (kinst, kindat, catalog and header)
447 450 '''
448 451 if not self.isConfig:
449 452 self.setup(path, oneDDict, ind2DList, twoDDict, metadata, format, **kwargs)
450 453 self.isConfig = True
451 454
452 455 self.dataOut = dataOut
453 456 self.putData()
454 return
457 return 1
455 458
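
A hedged configuration sketch for the run() call documented above; the output path and the kinst/kindat codes are placeholders, and dataOut stands for a populated Parameters object delivered by an upstream unit (normally the decorated writer runs as an external operation rather than being called by hand):

writer = MADWriter()
writer.run(
    dataOut,                                    # Parameters object from upstream
    path='/tmp/madrigal',                       # hypothetical output folder
    oneDDict='{"gdlatr": "lat", "gdlonr": "lon"}',
    ind2DList='["gdalt"]',
    twoDDict='{"gdalt": "heightList", "vn1p2": ["data_output", 0]}',
    metadata='{"kinst": 10, "kindat": 1910}',   # 10 -> 'jro'; kindat is a placeholder
    format='cedar')
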
456 459 def setup(self, path, oneDDict, ind2DList, twoDDict, metadata, format, **kwargs):
457 460 '''
458 461 Configure Operation
459 462 '''
460 463
461 464 self.path = path
462 465 self.blocks = kwargs.get('blocks', None)
463 466 self.counter = 0
464 467 self.oneDDict = load_json(oneDDict)
465 468 self.twoDDict = load_json(twoDDict)
466 469 self.ind2DList = load_json(ind2DList)
467 470 meta = load_json(metadata)
468 471 self.kinst = meta.get('kinst')
469 472 self.kindat = meta.get('kindat')
470 473 self.catalog = meta.get('catalog', DEF_CATALOG)
471 474 self.header = meta.get('header', DEF_HEADER)
472 475 if format == 'cedar':
473 476 self.ext = '.dat'
474 477 self.extra_args = {}
475 478 elif format == 'hdf5':
476 479 self.ext = '.hdf5'
477 480 self.extra_args = {'ind2DList': self.ind2DList}
478 481
479 482 self.keys = [k.lower() for k in self.twoDDict]
480 483 if 'range' in self.keys:
481 484 self.keys.remove('range')
482 485 if 'gdalt' in self.keys:
483 486 self.keys.remove('gdalt')
484 487
485 488 def setFile(self):
486 489 '''
487 490 Create new cedar file object
488 491 '''
489 492
490 493 self.mnemonic = MNEMONICS[self.kinst] #TODO get mnemonic from madrigal
491 494 date = datetime.datetime.utcfromtimestamp(self.dataOut.utctime)
492 495
493 496 filename = '{}{}{}'.format(self.mnemonic,
494 497 date.strftime('%Y%m%d_%H%M%S'),
495 498 self.ext)
496 499
497 500 self.fullname = os.path.join(self.path, filename)
498 501
499 502 if os.path.isfile(self.fullname) :
500 503 log.warning(
501 504 'Destination file {} already exists; previous file deleted.'.format(
502 505 self.fullname),
503 506 'MADWriter')
504 507 os.remove(self.fullname)
505 508
506 509 try:
507 510 log.success(
508 511 'Creating file: {}'.format(self.fullname),
509 512 'MADWriter')
510 513 self.fp = madrigal.cedar.MadrigalCedarFile(self.fullname, True)
511 514 except ValueError as e:
512 515 log.error(
513 516 'Unable to create a cedar file object with "madrigal.cedar.MadrigalCedarFile"',
514 517 'MADWriter')
515 518 return
516 519
517 520 return 1
518 521
519 522 def writeBlock(self):
520 523 '''
521 524 Add data records to cedar file taking data from oneDDict and twoDDict
522 525 attributes.
523 526 Allowed parameters in: parcodes.tab
524 527 '''
525 528
526 529 startTime = datetime.datetime.utcfromtimestamp(self.dataOut.utctime)
527 530 endTime = startTime + datetime.timedelta(seconds=self.dataOut.paramInterval)
528 531 heights = self.dataOut.heightList
529 532
530 533 if self.ext == '.dat':
531 534 for key, value in list(self.twoDDict.items()):
532 535 if isinstance(value, str):
533 536 data = getattr(self.dataOut, value)
534 537 invalid = numpy.isnan(data)
535 538 data[invalid] = self.missing
536 539 elif isinstance(value, (tuple, list)):
537 540 attr, key = value
538 541 data = getattr(self.dataOut, attr)
539 542 invalid = numpy.isnan(data)
540 543 data[invalid] = self.missing
541 544
542 545 out = {}
543 546 for key, value in list(self.twoDDict.items()):
544 547 key = key.lower()
545 548 if isinstance(value, str):
546 549 if 'db' in value.lower():
547 550 tmp = getattr(self.dataOut, value.replace('_db', ''))
548 551 SNRavg = numpy.average(tmp, axis=0)
549 552 tmp = 10*numpy.log10(SNRavg)
550 553 else:
551 554 tmp = getattr(self.dataOut, value)
552 555 out[key] = tmp.flatten()
553 556 elif isinstance(value, (tuple, list)):
554 557 attr, x = value
555 558 data = getattr(self.dataOut, attr)
556 559 out[key] = data[int(x)]
557 560
558 561 a = numpy.array([out[k] for k in self.keys])
559 562 nrows = numpy.array([numpy.isnan(a[:, x]).all() for x in range(len(heights))])
560 563 index = numpy.where(nrows == False)[0]
561 564
562 565 rec = madrigal.cedar.MadrigalDataRecord(
563 566 self.kinst,
564 567 self.kindat,
565 568 startTime.year,
566 569 startTime.month,
567 570 startTime.day,
568 571 startTime.hour,
569 572 startTime.minute,
570 573 startTime.second,
571 574 startTime.microsecond/10000,
572 575 endTime.year,
573 576 endTime.month,
574 577 endTime.day,
575 578 endTime.hour,
576 579 endTime.minute,
577 580 endTime.second,
578 581 endTime.microsecond/10000,
579 582 list(self.oneDDict.keys()),
580 583 list(self.twoDDict.keys()),
581 584 len(index),
582 585 **self.extra_args
583 586 )
584 587
585 588 # Setting 1d values
586 589 for key in self.oneDDict:
587 590 rec.set1D(key, getattr(self.dataOut, self.oneDDict[key]))
588 591
589 592 # Setting 2d values
590 593 nrec = 0
591 594 for n in index:
592 595 for key in out:
593 596 rec.set2D(key, nrec, out[key][n])
594 597 nrec += 1
595 598
596 599 self.fp.append(rec)
597 600 if self.ext == '.hdf5' and self.counter % 500 == 0 and self.counter > 0:
598 601 self.fp.dump()
599 if self.counter % 100 == 0 and self.counter > 0:
602 if self.counter % 20 == 0 and self.counter > 0:
600 603 log.log(
601 604 'Writing {} records'.format(
602 605 self.counter),
603 606 'MADWriter')
604 607
605 608 def setHeader(self):
606 609 '''
607 610 Create and add catalog and header to the cedar file
608 611 '''
609 612
610 613 log.success('Closing file {}'.format(self.fullname), 'MADWriter')
611 614
612 615 if self.ext == '.dat':
613 616 self.fp.write()
614 617 else:
615 618 self.fp.dump()
616 619 self.fp.close()
617 620
618 621 header = madrigal.cedar.CatalogHeaderCreator(self.fullname)
619 622 header.createCatalog(**self.catalog)
620 623 header.createHeader(**self.header)
621 624 header.write()
622 625
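
The catalog and header fall back to DEF_CATALOG and DEF_HEADER when not given; a sketch of overriding them through the metadata argument (all values illustrative):

import json

metadata = json.dumps({
    'kinst': 10,                                # 'jro' in MNEMONICS
    'kindat': 1910,                             # placeholder kindat code
    'catalog': {'principleInvestigator': 'Marco Milla',
                'expPurpose': 'illustrative experiment'},
    'header': {'analyst': 'Jicamarca User',
               'comments': 'illustrative comments'}})
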
623 626 def putData(self):
624 627
625 628 if self.dataOut.flagNoData:
626 629 return 0
627 630
628 631 if self.dataOut.flagDiscontinuousBlock or self.counter == self.blocks:
629 632 if self.counter > 0:
630 633 self.setHeader()
631 634 self.counter = 0
632 635
633 636 if self.counter == 0:
634 637 self.setFile()
635 638
636 639 self.writeBlock()
637 640 self.counter += 1
638 641
639 642 def close(self):
640 643
641 644 if self.counter > 0:
642 645 self.setHeader()
\ No newline at end of file
@@ -1,384 +1,390 @@
1 1 '''
2 2 Updated for multiprocessing
3 3 Author : Sergio Cortez
4 4 Jan 2018
5 5 Abstract:
6 6 Base class for processing units and operations. A decorator provides multiprocessing features and interconnects the processes created.
7 7 The arguments (kwargs) sent from the controller are parsed and filtered via the decorator for each processing unit or operation instantiated.
8 8 The decorator also handles the methods inside the processing unit that are called from the main script (not as operations) (OPERATION -> type ='self').
9 9
10 10 Based on:
11 11 $Author: murco $
12 12 $Id: jroproc_base.py 1 2012-11-12 18:56:07Z murco $
13 13 '''
14 14
15 15 import inspect
16 16 import zmq
17 17 import time
18 18 import pickle
19 19 import os
20 20 from multiprocessing import Process
21 21 from zmq.utils.monitor import recv_monitor_message
22 22
23 23 from schainpy.utils import log
24 24
25 25
26 26 class ProcessingUnit(object):
27 27
28 28 """
29 29 Update - Jan 2018 - MULTIPROCESSING
30 30 All the "call" methods present in the previous base were removed.
31 31 The majority of operations are independent processes, thus
32 32 the decorator is in charge of communicating the operation processes
33 33 with the processing unit via IPC.
34 34
35 35 The constructor does not receive any argument. The remaining methods
36 36 are related to the operations to execute.
37 37
38 38
39 39 """
40 40
41 41 def __init__(self):
42 42
43 43 self.dataIn = None
44 44 self.dataOut = None
45 45 self.isConfig = False
46 46 self.operations = []
47 47 self.plots = []
48 48
49 49 def getAllowedArgs(self):
50 50 if hasattr(self, '__attrs__'):
51 51 return self.__attrs__
52 52 else:
53 53 return inspect.getargspec(self.run).args
54 54
55 55 def addOperation(self, conf, operation):
56 56 """
57 57 This method is used in the controller and updates the dictionary containing the operations to execute. The dict
58 58 holds the id of the operation process (for IPC purposes).
59 59
60 60 Adds an object of type "Operation" (opObj) to the list of objects "self.objectList" and returns the
61 61 identifier associated with this object.
62 62
63 63 Input:
64 64
65 65 object : an object of the "Operation" class
66 66
67 67 Return:
68 68
69 69 objId : identifier of the object, needed to communicate with the master (procUnit)
70 70 """
71 71
72 72 self.operations.append(
73 73 (operation, conf.type, conf.id, conf.getKwargs()))
74 74
75 75 if 'plot' in self.name.lower():
76 76 self.plots.append(operation.CODE)
77 77
78 78 def getOperationObj(self, objId):
79 79
80 80 matches = [op for op, _, opId, _ in self.operations if opId == objId]
81 81 if not matches:
82 82 return None
83 83 return matches[0]
84 84
85 85 def operation(self, **kwargs):
86 86 """
87 87 Direct operation on the data (dataOut.data). The attribute values of the
88 88 dataOut object must be updated.
89 89
90 90 Input:
91 91
92 92 **kwargs : dictionary of arguments for the function to execute
93 93 """
94 94
95 95 raise NotImplementedError
96 96
97 97 def setup(self):
98 98
99 99 raise NotImplementedError
100 100
101 101 def run(self):
102 102
103 103 raise NotImplementedError
104 104
105 105 def close(self):
106 106
107 107 return
108 108
109 109
110 110 class Operation(object):
111 111
112 112 """
113 113 Update - Jan 2018 - MULTIPROCESSING
114 114
115 115 Most of the methods remain the same. The decorator parses the arguments and executes the run() method for each process.
116 116 The constructor does not receive any arguments, nor does the base class.
117 117
118 118
119 119 Base class for defining additional operations that can be added to the ProcessingUnit class
120 120 and that need to accumulate prior information about the data to process. Preferably, use an
121 121 accumulation buffer inside this class.
122 122
123 123 Example: coherent integration needs the prior information of the n previous profiles (buffer).
124 124
125 125 """
126 126
127 127 def __init__(self):
128 128
129 129 self.id = None
130 130 self.isConfig = False
131 131
132 132 if not hasattr(self, 'name'):
133 133 self.name = self.__class__.__name__
134 134
135 135 def getAllowedArgs(self):
136 136 if hasattr(self, '__attrs__'):
137 137 return self.__attrs__
138 138 else:
139 139 return inspect.getargspec(self.run).args
140 140
141 141 def setup(self):
142 142
143 143 self.isConfig = True
144 144
145 145 raise NotImplementedError
146 146
147 147 def run(self, dataIn, **kwargs):
148 148 """
149 149 Performs the necessary operations on dataIn.data and updates the
150 150 attributes of the dataIn object.
151 151
152 152 Input:
153 153
154 154 dataIn : an object of type JROData
155 155
156 156 Return:
157 157
158 158 None
159 159
160 160 Affected:
161 161 __buffer : data reception buffer.
162 162
163 163 """
164 164 if not self.isConfig:
165 165 self.setup(**kwargs)
166 166
167 167 raise NotImplementedError
168 168
169 169 def close(self):
170 170
171 171 return
172 172
173 173
174 174 def MPDecorator(BaseClass):
175 175 """
176 176 Multiprocessing class decorator
177 177
178 178 This function adds multiprocessing features to a BaseClass. It also handles
179 179 the communication between processes (readers, procUnits and operations).
180 180 """
181 181
182 182 class MPClass(BaseClass, Process):
183 183
184 184 def __init__(self, *args, **kwargs):
185 185 super(MPClass, self).__init__()
186 186 Process.__init__(self)
187 187 self.operationKwargs = {}
188 188 self.args = args
189 189 self.kwargs = kwargs
190 190 self.sender = None
191 191 self.receiver = None
192 192 self.name = BaseClass.__name__
193 193 if 'plot' in self.name.lower() and not self.name.endswith('_'):
194 194 self.name = '{}{}'.format(self.CODE.upper(), 'Plot')
195 195 self.start_time = time.time()
196 196
197 197 if len(self.args) == 3:
198 198 self.typeProc = "ProcUnit"
199 199 self.id = args[0]
200 200 self.inputId = args[1]
201 201 self.project_id = args[2]
202 202 elif len(self.args) == 2:
203 203 self.id = args[0]
204 204 self.inputId = args[0]
205 205 self.project_id = args[1]
206 206 self.typeProc = "Operation"
207 207
208 208 def subscribe(self):
209 209 '''
210 210 This function creates a socket to receive objects from the
211 211 topic `inputId`.
212 212 '''
213 213
214 214 c = zmq.Context()
215 215 self.receiver = c.socket(zmq.SUB)
216 216 self.receiver.connect(
217 217 'ipc:///tmp/schain/{}_pub'.format(self.project_id))
218 218 self.receiver.setsockopt(zmq.SUBSCRIBE, self.inputId.encode())
219 219
220 220 def listen(self):
221 221 '''
222 222 This function waits for objects and deserializes them using pickle
223 223 '''
224 224
225 225 data = pickle.loads(self.receiver.recv_multipart()[1])
226 226
227 227 return data
228 228
229 229 def set_publisher(self):
230 230 '''
231 231 This function creates a socket for publishing purposes.
232 232 '''
233 233
234 234 time.sleep(1)
235 235 c = zmq.Context()
236 236 self.sender = c.socket(zmq.PUB)
237 237 self.sender.connect(
238 238 'ipc:///tmp/schain/{}_sub'.format(self.project_id))
239 239
240 240 def publish(self, data, id):
241 241 '''
242 242 This function publishes an object to a specific topic.
243 243 '''
244 244 self.sender.send_multipart([str(id).encode(), pickle.dumps(data)])
245 245
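
subscribe()/publish() above implement topic-filtered PUB/SUB messaging where frame 0 is the topic and frame 1 a pickled object; a standalone sketch of the same framing (the endpoints are made up, and a forwarder bridging the *_sub and *_pub endpoints is assumed, as in the project):

import pickle
import zmq

context = zmq.Context()

# Publisher side: topic as frame 0, pickled payload as frame 1.
sender = context.socket(zmq.PUB)
sender.connect('ipc:///tmp/schain/demo_sub')    # hypothetical endpoint
sender.send_multipart([b'unit01', pickle.dumps({'utctime': 0})])

# Subscriber side: prefix-filter on the topic, unpickle frame 1.
receiver = context.socket(zmq.SUB)
receiver.connect('ipc:///tmp/schain/demo_pub')  # hypothetical endpoint
receiver.setsockopt(zmq.SUBSCRIBE, b'unit01')
data = pickle.loads(receiver.recv_multipart()[1])
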
246 246 def runReader(self):
247 247 '''
248 248 Run function for reader units
249 249 '''
250 250 while True:
251 251
252 252 BaseClass.run(self, **self.kwargs)
253 253
254 254 for op, optype, opId, kwargs in self.operations:
255 255 if optype == 'self' and not self.dataOut.flagNoData:
256 256 op(**kwargs)
257 257 elif optype == 'other' and not self.dataOut.flagNoData:
258 258 self.dataOut = op.run(self.dataOut, **self.kwargs)
259 259 elif optype == 'external':
260 260 self.publish(self.dataOut, opId)
261 261
262 262 if self.dataOut.flagNoData and not self.dataOut.error:
263 263 continue
264 264
265 265 self.publish(self.dataOut, self.id)
266 266
267 267 if self.dataOut.error:
268 268 log.error(self.dataOut.error, self.name)
269 269 # self.sender.send_multipart([str(self.project_id).encode(), 'end'.encode()])
270 270 break
271 271
272 272 time.sleep(1)
273 273
274 274 def runProc(self):
275 275 '''
276 276 Run function for processing units
277 277 '''
278 278
279 279 while True:
280 280 self.dataIn = self.listen()
281 281
282 282 if self.dataIn.flagNoData and self.dataIn.error is None:
283 283 continue
284 284
285 285 BaseClass.run(self, **self.kwargs)
286 286
287 287 if self.dataIn.error:
288 288 self.dataOut.error = self.dataIn.error
289 self.dataOut.flagNoData = True
290
289 self.dataOut.flagNoData = True
290
291 291 for op, optype, opId, kwargs in self.operations:
292 292 if optype == 'self' and not self.dataOut.flagNoData:
293 293 op(**kwargs)
294 294 elif optype == 'other' and not self.dataOut.flagNoData:
295 295 self.dataOut = op.run(self.dataOut, **kwargs)
296 elif optype == 'external' and not self.dataOut.flagNoData:
297 if not self.dataOut.flagNoData or self.dataOut.error:
298 self.publish(self.dataOut, opId)
296 elif optype == 'external' and not self.dataOut.flagNoData:
297 self.publish(self.dataOut, opId)
299 298
300 299 if not self.dataOut.flagNoData or self.dataOut.error:
301 300 self.publish(self.dataOut, self.id)
301 for op, optype, opId, kwargs in self.operations:
302 if optype == 'self' and self.dataOut.error:
303 op(**kwargs)
304 elif optype == 'other' and self.dataOut.error:
305 self.dataOut = op.run(self.dataOut, **kwargs)
306 elif optype == 'external' and self.dataOut.error:
307 self.publish(self.dataOut, opId)
302 308
303 309 if self.dataIn.error:
304 310 break
305 311
306 312 time.sleep(1)
307 313
308 314 def runOp(self):
309 315 '''
310 316 Run function for external operations (these operations just receive data,
311 317 e.g. plots, writers, publishers)
312 318 '''
313 319
314 320 while True:
315 321
316 322 dataOut = self.listen()
317 323
318 324 BaseClass.run(self, dataOut, **self.kwargs)
319 325
320 326 if dataOut.error:
321 327 break
322 328
323 329 time.sleep(1)
324 330
325 331 def run(self):
326 332 if self.typeProc == "ProcUnit":
327 333
328 334 if self.inputId is not None:
329 335
330 336 self.subscribe()
331 337
332 338 self.set_publisher()
333 339
334 340 if 'Reader' not in BaseClass.__name__:
335 341 self.runProc()
336 342 else:
337 343 self.runReader()
338 344
339 345 elif self.typeProc == "Operation":
340 346
341 347 self.subscribe()
342 348 self.runOp()
343 349
344 350 else:
345 351 raise ValueError("Unknown type")
346 352
347 353 self.close()
348 354
349 355 def event_monitor(self, monitor):
350 356
351 357 events = {}
352 358
353 359 for name in dir(zmq):
354 360 if name.startswith('EVENT_'):
355 361 value = getattr(zmq, name)
356 362 events[value] = name
357 363
358 364 while monitor.poll():
359 365 evt = recv_monitor_message(monitor)
360 366 if evt['event'] == 32: # zmq.EVENT_ACCEPTED
361 367 self.connections += 1
362 368 if evt['event'] == 512: # zmq.EVENT_DISCONNECTED
363 369 pass
364 370
365 371 evt.update({'description': events[evt['event']]})
366 372
367 373 if evt['event'] == zmq.EVENT_MONITOR_STOPPED:
368 374 break
369 375 monitor.close()
370 376 print('event monitor thread done!')
371 377
372 378 def close(self):
373 379
374 380 BaseClass.close(self)
375 381
376 382 if self.sender:
377 383 self.sender.close()
378 384
379 385 if self.receiver:
380 386 self.receiver.close()
381 387
382 388 log.success('Done...(Time:{:4.2f} secs)'.format(time.time()-self.start_time), self.name)
383 389
384 390 return MPClass
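
A hedged sketch of the decorator in use on a minimal external operation; the ids are placeholders. Per __init__ above, an operation receives (id, project_id) while a processing unit receives (id, inputId, project_id); start() launches the child process, whose run() subscribes and feeds each received object to the operation's run():

from schainpy.model.proc.jroproc_base import MPDecorator, Operation

@MPDecorator
class PrintTime(Operation):
    '''Toy external operation: print the timestamp of each received object.'''

    def run(self, dataOut, **kwargs):
        print(dataOut.utctime)

op = PrintTime('2', 'project01')                # placeholder id and project_id
op.start()                                      # runOp() loops in a child process
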
1 NO CONTENT: modified file
The requested commit or file is too big and content was truncated.