processing input from multiple files

Christopher Steele christopher.steele at uea.ac.uk
Thu Oct 14 06:08:27 EDT 2010


Hi

I've been trying to decode a series of observations from multiple files
(each file is a different time) and put each type of observation into their
own separate file. The script runs successfully for one file but whenever I
try it for more they just overwrite each other. I'm new to python and I'm
not sure how to go about efficiently running through the process once and
then appending to the output file for all other input files. Has anyone done
something similar to this before?



If it helps, I'll also attach a sample of one of the input files


#!/usr/bin/python

import sys
import os
import re
import fileinput

#load in file list
#obs = os.system('ls s[i,m,n]uk[0,2,4][1,2,3]d_??00P.DATA')
obs = ['siuk21d_0300P.DATA', 'siuk21d_0900P.DATA']
print obs
#code for file type "datalist"
#fname = "datalist_201081813.txt"


#output files
foutname1 = 'prestest.txt'
foutname2 = 'temptest.txt'
foutname3 = 'tempdtest.txt'
foutname4 = 'wspeedtest.txt'
foutname5 = 'winddtest.txt'


#prepare times
time=[]
year="2009"
month="09"
day="18"
hour=[]

#outputs
pres_out = ''
temp_out = ''
dtemp_out = ''
dir_out = ''
speed_out = ''
x =''


#load in station file with lat/lons
file2 = open("uk_stations.txt","r")
stations = file2.readlines()
ids=[]
names=[]
lats=[]
lons=[]
for item in stations:
    item_list = item.strip().split(',')
    ids.append(item_list[0])
    names.append(item_list[1])
    lats.append(item_list[2])
    lons.append(item_list[3])

#create loop over file list
time= [item.split('_')[1].split('.')[0] for item in obs]
print time
for x in time:
    hour= x[:2]
    print hour
    newtime = year+month+day+'_'+hour+'00'
print newtime
for file  in fileinput.input(obs):
    data=file[:file.find(' 333 ')]
    #data=st[split:]
    print data
    elements=data.split(' ')
    print elements
    station_id = elements[0]
    try:
        index = ids.index(station_id)
        lat = lats[index]
        lon = lons[index]
        message_type = 'ADPSFC'
    except:
        print 'Station ID',station_id,'not in list!'
        lat = lon = 'NaN'
        message_type = 'Bad_station_id'
    try:
        temp = [item for item in elements if item.startswith('1')][0]
        temperature = float(temp[2:])/10
        sign = temp[1]
        if sign == 1:
           temperature=-temperature
    except:
            temperature='NaN'

    try:
        dtemp = [item for item in elements if item.startswith('2')][0]
        dtemperature = float(dtemp[2:])/10
        sign = dtemp[1]
        if sign == 1:
            dtemperature=-dtemperature
    except:
            detemperature='NaN'
    try:
        press = [item for item in elements[2:] if item.startswith('4')][0]
        if press[1]=='9':
            pressure = float(press[1:])/10
        else:
            pressure = float(press[1:])/10+1000
    except:
        pressure = 'NaN'

    try:
        wind = elements[elements.index(temp)-1]
        direction = float(wind[1:3])*10
        speed = float(wind[3:])*0.514444444
    except:
        direction=speed='NaN'



    newline =
message_type+c+str(station_id)+c+newtime+c+lat+c+lon+c+c+"-9999"+c+ "002"
+c+"-9999"+c+"-9999"+c+str(pressure)+c
    pres_out+=newline+'\n'


    newline2 =
message_type+c+str(station_id)+c+newtime+c+lat+c+lon+c+c+"-9999"+c+ "011"
+c+"-9999"+c+"-9999"+c+str(temperature)+c
    print newline2
    temp_out+=newline2+'\n'
    fout = open(foutname2,'w')
    fout.writelines(temp_out)
    fout.close()




    newline3 =
message_type+c+str(station_id)+c+newtime+c+lat+c+lon+c+c+"-9999"+c+ "017"
+c+"-9999"+c+"-9999"+c+str(dtemperature)+c
    print newline3
    dtemp_out+=newline3+'\n'
    fout = open(foutname3,'w')
    fout.writelines(dtemp_out)
    fout.close()


    newline4 =
message_type+c+str(station_id)+c+newtime+c+lat+c+lon+c+c+"-9999"+c+ "031"
+c+"-9999"+c+"-9999"+c+str(direction)+c
    print newline4
    dir_out+=newline4+'\n'
    fout = open(foutname4,'w')
    fout.writelines(dir_out)
    fout.close()


    newline5 =
message_type+c+str(station_id)+c+newtime+c+lat+c+lon+c+c+"-9999"+c+
"032"+c+"-9999"+c+"-9999"+c+str(speed)+c
    print newline5
    speed_out+=newline5+'\n'


fout = open(foutname1,'w')
fout.writelines(pres_out)
fout.close()
fout = open(foutname2,'w')
fout.writelines(temp_out)
fout.close()
fout = open(foutname3,'w')
fout.writelines(dtemp_out)
fout.close()
fout = open(foutname4,'w')
fout.writelines(dir_out)
fout.close()
fout = open(foutname5,'w')
fout.writelines(speed_out)
fout.close()










cheers

Chris
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mail.python.org/pipermail/python-list/attachments/20101014/e955f299/attachment.html>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: siuk21d_0300P.DATA
Type: application/octet-stream
Size: 3299 bytes
Desc: not available
URL: <http://mail.python.org/pipermail/python-list/attachments/20101014/e955f299/attachment.obj>


More information about the Python-list mailing list