From 40c461f565e8c4928d388c47f77d11defe4a619d Mon Sep 17 00:00:00 2001 From: Michael Love <mlove@passcal.nmt.edu> Date: Thu, 16 Aug 2018 14:57:26 -0600 Subject: [PATCH] Compatibility & code cleanup. Updated for Python 2.7 & 3.6 compatibility. Code cleanup for PEP 8 standards. --- HISTORY.rst | 6 ++ docs/conf.py | 0 refscrub/__init__.py | 2 +- refscrub/refscrub.py | 239 +++++++++++++++++++++++++------------------ setup.cfg | 2 +- setup.py | 4 +- 6 files changed, 147 insertions(+), 106 deletions(-) mode change 100755 => 100644 docs/conf.py mode change 100755 => 100644 refscrub/refscrub.py diff --git a/HISTORY.rst b/HISTORY.rst index 158c12c..ffd258c 100644 --- a/HISTORY.rst +++ b/HISTORY.rst @@ -16,3 +16,9 @@ History ------------------ * Minor fixes of global variables + +2018.227 (2018-09-16) +------------------ + +* Python 2.7 & 3.6 compatiblity. +* Code cleanup to match PEP 8. diff --git a/docs/conf.py b/docs/conf.py old mode 100755 new mode 100644 diff --git a/refscrub/__init__.py b/refscrub/__init__.py index 384ebd4..efb2f2d 100644 --- a/refscrub/__init__.py +++ b/refscrub/__init__.py @@ -4,4 +4,4 @@ __author__ = """IRIS PASSCAL""" __email__ = 'software-support@passcal.nmt.edu' -__version__ = '2018.204' +__version__ = '2018.227' diff --git a/refscrub/refscrub.py b/refscrub/refscrub.py old mode 100755 new mode 100644 index ba46a85..3d0d7b1 --- a/refscrub/refscrub.py +++ b/refscrub/refscrub.py @@ -1,5 +1,5 @@ #!/usr/bin/env python -''' +""" Lloyd Carothers February 2011 Rewrite of original refscrub @@ -7,53 +7,65 @@ Rewrite of original refscrub Derick Hess July 2018 Minor fixes for new build system -''' -from __future__ import with_statement -USAGE = 'usage: %prog [options] infile1 [ infile2 ... infileN]' -#USAGE = '''Scans (default) or extracts good reftek packets from a REFTEK file or CF card.''' -PROG_VERSION = '2018.204' +Michael Love +August 2018 +Updates to work on both Python 2 & 3. +Code cleanup to match PEP 8. +""" +from __future__ import (print_function, with_statement) +from os.path import join, basename, getsize +import sys +import struct + +USAGE = 'usage: %prog [options] infile1 [ infile2 ... infileN]' +PROG_VERSION = '2018.227' VERBOSE = False EXTRACT = False SUMMARY_FILE = 'scrubsum.txt' +PREFIX = "" +INFILE = "" +FILESIZE = 0 +TABS = "\t\t\t\t" -tabs = "\t\t\t\t" -from os.path import join, basename, getsize -import sys -import struct - -class SN(): - def __init__(self, SN): +class SN: + def __init__(self, sn): global EXTRACT global PREFIX - self.SN = SN + self.sn = sn self.count = 0 self.dates = list() if EXTRACT: - self.outfh = open( PREFIX + '.' + SN +'.scrub.ref', 'ab') + self.outfh = open(PREFIX + '.' + sn + '.scrub.ref', 'ab') else: self.outfh = None + def look(self, year, day, hour): self.dates.append((year, day, hour)) self.count += 1 + def close_fh(self): if self.outfh is not None: self.outfh.close() + def __str__(self): self.dates = list(set(self.dates)) self.dates.sort() start = "%0.2d:%0.3d:%0.2d" % (self.dates[0]) - end = "%0.2d:%0.3d:%0.2d" % (self.dates[-1]) - return "%7s: %s -- %s : %12d\n" % (self.SN , start , end, self.count ) + end = "%0.2d:%0.3d:%0.2d" % (self.dates[-1]) + return "%7s: %s -- %s : %12d\n" % (self.sn, start, end, self.count) + class SNseen(dict): def look(self, sn, year, day, hour): - ret = self.setdefault(sn,SN(sn) ) - ret.look( year, day, hour) + ret = self.setdefault(sn, SN(sn)) + ret.look(year, day, hour) + def close_fhs(self): for sn in self.values(): sn.close_fh() + def __str__(self): s = " SN: YR:DAY:HR -- YR:DAY:HR : %12s\n" % 'Good Packets' for sn in self.values(): @@ -61,122 +73,142 @@ class SNseen(dict): return s -##class SNseen(dict): -## def __init__(self): -## self.outfiledict = dict() -## def look(self, SN, year, day, hour): -## ret = self.setdefault(SN, list()) -## #make a file for a new seen SN -## if EXTRACT and not self.outfiledict.has_key(SN) : -## self.outfiledict[SN] = open( PREFIX + '.' + SN +'.scrub.ref', 'ab') -## if (year, day, hour) not in ret: -## self[SN].append((year, day, hour)) -## def close_fhs(self): -## for fh in self.outfiledict.values(): -## fh.close() -## def __str__(self): -## s = " SN: YR:DAY:HR -- YR:DAY:HR\n" -## for sn in self.keys(): -## dates = self[sn] -## dates.sort() -## start = "%0.2d:%0.3d:%0.2d" % (dates[0]) -## end = "%0.2d:%0.3d:%0.2d" % (dates[-1]) -## s += "%7s: %s -- %s\n" % (sn , start , end ) -## return s +# class SNseen(dict): +# def __init__(self): +# self.outfiledict = dict() +# def look(self, SN, year, day, hour): +# ret = self.setdefault(SN, list()) +# #make a file for a new seen SN +# if EXTRACT and not self.outfiledict.has_key(SN) : +# self.outfiledict[SN] = open( PREFIX + '.' + SN +'.scrub.ref', 'ab') +# if (year, day, hour) not in ret: +# self[SN].append((year, day, hour)) +# def close_fhs(self): +# for fh in self.outfiledict.values(): +# fh.close() +# def __str__(self): +# s = " SN: YR:DAY:HR -- YR:DAY:HR\n" +# for sn in self.keys(): +# dates = self[sn] +# dates.sort() +# start = "%0.2d:%0.3d:%0.2d" % (dates[0]) +# end = "%0.2d:%0.3d:%0.2d" % (dates[-1]) +# s += "%7s: %s -- %s\n" % (sn , start , end ) +# return s class RTPacket: RTstruct = struct.Struct('2c1B1B2B6B2B2B') - #packetHdrFmt = '2c1B1B2B6B2B2B' - packet_types = ( 'AD', 'CD', 'DS', 'DT', 'EH', 'ET', 'OM', 'SH', 'SC') - seen = SNseen() + # packetHdrFmt = '2c1B1B2B6B2B2B' + packet_types = ('AD', 'CD', 'DS', 'DT', 'EH', 'ET', 'OM', 'SH', 'SC') + seen = SNseen() goodpkts = 0 IOErrorCount = 0 + def __init__(self, data): self.data = data self.valid = None + self.timestring = None + self.ptype = None + self.expnum = None + self.year = None + self.sn = None + self.day = None + self.hour = None + self.min = None + self.sec = None + self.millisec = None + self.bytecount = None + self.sequence = None + def __str__(self): self.settimestring() s = "%(sequence)s %(ptype)s %(sn)s %(timestring)s" % self.__dict__ return s + def write(self): outfh = RTPacket.seen[self.sn].outfh - #outfh = RTPacket.seen.outfiledict[self.sn] + # outfh = RTPacket.seen.outfiledict[self.sn] try: outfh.write(self.data) - except Exception, e: - print "Failed to write extracted data to %s" % outfh.filename - print e + except Exception as e: + print("Failed to write extracted data to %s" % outfh.filename) + print(e) + def settimestring(self): - self.timestring = "%(year)0.2d:%(day)0.3d:%(hour)0.2d:%(min)0.2d:%(sec)0.2d.%(millisec)0.3d" % self.__dict__ + self.timestring = "%(year)0.2d:%(day)0.3d:%(hour)0.2d:%(min)0.2d:%(sec)0.2d.%(millisec)0.3d" % self.__dict__ + def isvalid(self): - ''' + """ Returns True if a valid reftek packet (headers parse well and are valid) Also populates the objects attributes SN, time, etc. - ''' + """ global VERBOSE try: tup = RTPacket.RTstruct.unpack(self.data[:16]) - #tup = unpack( self.packetHdrFmt, self.data[:16]) + # tup = unpack( self.packetHdrFmt, self.data[:16]) self.ptype = tup[0] + tup[1] assert self.ptype in self.packet_types, "BAD packet type" self.expnum = int("%0.2X" % tup[2]) - self.year = int("%0.2X" %tup[3]) - self.sn = "%0.2X%0.2X" % (tup[4] , tup[5] ) + self.year = int("%0.2X" % tup[3]) + self.sn = "%0.2X%0.2X" % (tup[4], tup[5]) assert '9001' <= self.sn, "BAD SN" - assert self.sn <= 'FFFF' , "BAD SN" + assert self.sn <= 'FFFF', "BAD SN" time = "%0.2X%0.2X%0.2X%0.2X%0.2X%0.2X" % tup[6:12] self.day, self.hour, self.min, self.sec, self.millisec = \ - int(time[:3]),int(time[3:5]),int(time[5:7]),int(time[7:9]),int(time[9:]) + int(time[:3]), int(time[3:5]), int(time[5:7]), int(time[7:9]), int(time[9:]) assert self.day <= 366, "BAD TIME" - assert self.hour <=24, "BAD TIME" + assert self.hour <= 24, "BAD TIME" assert self.min <= 60, "BAD TIME" - assert self.sec <=80, "BAD TIME" - assert self.millisec <=1000, "BAD TIME" + assert self.sec <= 80, "BAD TIME" + assert self.millisec <= 1000, "BAD TIME" self.bytecount = int("%0.2X%0.2X" % tup[12:14]) assert self.bytecount >= 24, "BAD byte count" assert self.bytecount <= 1024, "BAD bytecount" self.sequence = int("%0.2X%0.2X" % tup[14:16]) - #not a valid packet - except Exception , e: + # not a valid packet + except Exception as e: if VERBOSE: - print tabs +"Not a valid REFTEK packet" - print tabs + str(e) + print(TABS + "Not a valid REFTEK packet") + print(TABS + str(e)) self.valid = False return False - #parsed well :: valid packet + # parsed well :: valid packet else: self.valid = True RTPacket.seen.look(self.sn, self.year, self.day, self.hour) - RTPacket.goodpkts +=1 + RTPacket.goodpkts += 1 return True -def readfile(infile): + +def readfile(filename): ticker = 1 - #speedup local vars + # speedup local vars global VERBOSE global EXTRACT - tell = infile.tell - read = infile.read - seek = infile.seek + tell = filename.tell + read = filename.read + seek = filename.seek while True: ticker += 1 if VERBOSE is False and ticker == 10000: - print summary() + print(summary()) ticker = 1 - if VERBOSE: print "OFFSET: %12d" % tell() + if VERBOSE: + print("OFFSET: %12d" % tell()) # often disk wont read try: buffer = read(1024) except IOError: - print tabs + "IOError on read" - print tabs + "Skipping 1MB.." + print(TABS + "IOError on read") + print(TABS + "Skipping 1MB..") RTPacket.IOErrorCount += 1 - seek(1024*1024, 1) + seek(1024 * 1024, 1) continue - #End of file + # End of file if len(buffer) < 1024: - if VERBOSE: print "Partial packet" + if VERBOSE: + print("Partial packet") break p = RTPacket(buffer) valid = p.isvalid() @@ -185,43 +217,48 @@ def readfile(infile): if EXTRACT: p.write() if VERBOSE: - print p - print "<<<<<<<" - #packet is bad + print(p) + print("<<<<<<<") + # packet is bad else: if VERBOSE: - print tabs + "NOT VALID" - print tabs + ">>>>>>>>" + print(TABS + "NOT VALID") + print(TABS + ">>>>>>>>") seek(-1023, 1) - print summary() - #commented out as when run with many files as input like a cf dir the closed fh's need to be written to and isn't smart enough to be opened - #RTPacket.seen.close_fhs() + print(summary()) + # commented out as when run with many files as input like a cf dir the closed fh's need to be written to and isn't + # smart enough to be opened RTPacket.seen.close_fhs() + def summary(): - global infile + global INFILE global FILESIZE - OFFSTRING = "%6s: %12d\n" - s = OFFSTRING % ( "OFFSET", infile.tell()) - s += OFFSTRING % ( "OF", FILESIZE) + offstring = "%6s: %12d\n" + s = offstring % ("OFFSET", INFILE.tell()) + s += offstring % ("OF", FILESIZE) s += "Good packets: %d = %8.2fMB\n" % (RTPacket.goodpkts, RTPacket.goodpkts / 1024.0) - s+= "IOErrors: %d\n" % (RTPacket.IOErrorCount) + s += "IOErrors: %d\n" % RTPacket.IOErrorCount s += str(RTPacket.seen) + '\n' return s + def main(): global VERBOSE global EXTRACT global PREFIX - global infile + global INFILE global FILESIZE + summaryfh = None from optparse import OptionParser parser = OptionParser(USAGE, version="%prog " + PROG_VERSION) parser.description = "infile can be a REFTEK file or a raw disk (/dev/disk1) of a CF card." parser.add_option('-v', '--verbose', dest="VERBOSE", action='store_true', default=False, help="Prints info about each packet, good or bad. This will increase runtime.") parser.add_option('-e', '--extract', dest='EXTRACT', action='store_true', default=False, - help='Writes good packets to files named infile.SNXX.scrub.ref OR PREFIX.SNXX.scrub.ref, if given, for each Serial Number found. If output file exists it will append. Be careful not to duplicate data by running more than once on the same file in the same dir.') + help='Writes good packets to files named infile.SNXX.scrub.ref OR PREFIX.SNXX.scrub.ref, ' + ' if given, for each Serial Number found. If output file exists it will append. Be careful ' + 'not to duplicate data by running more than once on the same file in the same dir.') parser.add_option('-p', '--prefix', dest='PREFIX', help='Prefix of output filename. Defaults to inputfilename') parser.add_option('-s', '--savesum', dest='SUMMARY', action='store_true', default=False, @@ -233,24 +270,22 @@ def main(): if options.SUMMARY: summaryfh = open(SUMMARY_FILE, 'a') for infilename in args: - print - "Processing: %s" % infilename + print("Processing: %s" % infilename) if not PREFIX: PREFIX = basename(infilename) - print - "Using prefix %s" % PREFIX + print("Using prefix %s" % PREFIX) FILESIZE = getsize(infilename) - with open(infilename) as infile: - # with open( infile.name + 'scrub.ref')) as outfile: + with open(infilename) as filename: + # with open( filename.name + 'scrub.ref')) as outfile: # import profile - # profile.run('readfile(infile)') - readfile(infile) + # profile.run('readfile(filename)') + readfile(filename) if options.SUMMARY: summaryfh.write(infilename + ', ' + PREFIX + '\n') summaryfh.write(summary()) - print - "----------------------------------------" + print("----------------------------------------") + if __name__ == '__main__': main() diff --git a/setup.cfg b/setup.cfg index 01be888..5e7c599 100644 --- a/setup.cfg +++ b/setup.cfg @@ -1,5 +1,5 @@ [bumpversion] -current_version = 2018.180 +current_version = 2018.227 commit = True tag = True diff --git a/setup.py b/setup.py index 194d54d..29be5b2 100644 --- a/setup.py +++ b/setup.py @@ -20,7 +20,7 @@ setup( 'Intended Audience :: Developers', 'License :: OSI Approved :: GNU General Public License v3 (GPLv3)', 'Natural Language :: English', - 'Programming Language :: Python :: 2.7', + 'Programming Language :: Python :: 3.6', ], description="Remove select packets from RT130 data", entry_points={ @@ -51,6 +51,6 @@ setup( packages=find_packages(include=['refscrub']), test_suite='tests', url='https://git.passcal.nmt.edu/passoft/refscrub', - version='2018.204', + version='2018.227', zip_safe=False, ) -- GitLab