import time dayNames = {0:'Mon',1:'Tue',2:'Wed',3:'Thu', 4:'Fri',5:'Sat',6:'Sun'} monthNames = {1:'Jan',2:'Feb',3:'Mar',4:'Apr',5:'May',6:'Jun',7:'Jul',8:'Aug',9:'Sep',10:'Oct',11:'Nov',12:'Dec'} nameToNumber = {} lines = [] with open("C:\RawCallLogs.csv","r") as f: for line in f: fields = line.split(',') folder = fields[0].replace('\"','') if folder == 'Folder': continue number = fields[1].replace('\"','') name = fields[2].replace('\"','') rawtime = fields[3].replace('\"','') structTime = time.strptime(rawtime,'%m/%d/%Y %H:%M:%S') weekday = "Weekday" if (structTime.tm_wday >= 5): weekday = "Weekend" dayName = dayNames[structTime.tm_wday] month = monthNames[structTime.tm_mon] day = structTime.tm_mday year = structTime.tm_year evening = "Daytime" if structTime.tm_hour > 18: evening = "Evening" duration = int(fields[4].replace('\"','').replace('\n',''))/60.0 if number == '-1': name = 'Unknown' if name != "": if name not in nameToNumber: nameToNumber[name] = set([number]) else: nameToNumber[name].add(number) lines.append([folder,number,name,rawtime,duration,weekday,evening,dayName,month,day,year,structTime.tm_hour,structTime.tm_min]) print len(lines) def is08Number(number): return number.startswith('08') or number.startswith('0448') def isLandlineNumber(number): return number.startswith('02') or number.startswith('0442') def isMobile(number): return len(number) > 7 def isInternational(number): return number.startswith('0091') or number.startswith('+91') with open("C:\RawCallLogsOut.csv","w") as f: f.write('Folder,Number,Name,Raw time,Duration,Weekday(s),DayTime,DayofWeek,Month,Day,Year,Hour,Min,NumberType\n') for line in lines: if (line[2] == ''):# No name for name,numbers in nameToNumber.items(): for number in numbers: numberInLine = line[1][::-1][:6][::-1] numberInMap = number[::-1][:6][::-1] if numberInLine == numberInMap: line[2] = name break if (line[2] == ''): if is08Number(line[1]): line[2] = "Unknown 08 Number" elif isLandlineNumber(line[1]): line[2] = 'Unknown landline' elif isMobile(line[1]): line[2] = 'Unknown mobile' else: line[2] = 'Unknown' numberType = 'Unknown' if (is08Number(line[1])): numberType = "08 Number" elif isLandlineNumber(line[1]): numberType = "Landline" elif isInternational(line[1]): numberType = "International" elif isMobile(line[1]): numberType = "Mobile" f.write("%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s\n" % (line[0],line[1],line[2],line[3],line[4],line[5],line[6],line[7],\ line[8],line[9],line[10],line[11],line[12],numberType))
Thursday, December 09, 2010
Data conversion
Some data conversion
Wednesday, October 20, 2010
Python: Accessing https pages from behing an authenticating proxy server
from urllib2 import ProxyHandler, build_opener proxyMap = {'https': 'http://(user):(pass)@(proxyhost):(proxypass)/'} proxy = ProxyHandler(proxyMap) opener = build_opener(proxy) u = opener.open('https://somehttpspage') data = u.read() charset = u.info().getparam('charset') # Python 2 print 'CharSet %s' % charset print '------------------------------------------------------------------------' print data
Friday, April 16, 2010
Python script for creating video using images and adding audio
I am usng a python script for converting images into a vidoe (using Java JMF) and then adding the audio to the vidoe and converting it to an mp4 format so that I can play it on my phone.
''' Created on 15 Apr 2010 @author: viswanav ''' import glob, subprocess, os vlcLocation = "C:\Development\Apps\PortableApps\VLCPortable\App\\vlc\\vlc.exe" for g in glob.glob("C:\Development\Docs\Books\VideoCDs\*\PK*"): audioFile = "" for flvGlob in glob.glob(g + "\*\media\*.flv"): audioFile = flvGlob break; convertToMov = ["java","-cp","C:\Development\workspaces\Trials\JavaTrials\JMF\out\production\JMFTrial","JpegImagesToMovie", "-w", "400","-h","300","-f","15",g] #print convertToMov print "Convert to Mov File" subprocess.call(convertToMov) movFileLocation = "" for movFile in glob.glob(g + "\*.mov"): movFileLocation= movFile break stdoutCommand = "--sout=#transcode{vcodec=mp4v,vb=800,acodec=mp4a,ab=128,scale=1,channels=2,audio-sync}:std{access=file,mux=mp4,dst=\"%s.mp4\"}" % movFileLocation print stdoutCommand addAudioAndConverToMp4Command = [vlcLocation,"-I","dummy",movFileLocation,"--input-slave=\"%s\"" % audioFile,stdoutCommand,"vlc://quit"] print addAudioAndConverToMp4Command print "Creating mp4 file" subprocess.call(addAudioAndConverToMp4Command) deleteMovCommand = ["del",movFileLocation] print deleteMovCommand print "Deleting mov file" os.remove(movFileLocation)
Python application for downloading a book and converting to pdf
A similar application in python for downloading book images from the net and converting it to a pdf file, but this time using python
''' Created on 25 Mar 2010 ''' import httplib import os import sys from optparse import OptionParser import time, thread from reportlab.pdfgen import canvas from reportlab.lib.pagesizes import letter, A4 from reportlab.lib.units import cm, mm, inch, pica write = sys.stdout.write h = httplib.HTTPConnection('webproxy',8080) headers = {'Cookie':''} size = 1800 urltemplate = ' /%s/pages/%i.jpg?width=1800' books = ('isbn2','isbn1') maxPages = 10000 def downloadBookImages(folderLocation,isbn): bookLocation = folderLocation + "\\%s" % isbn print 'Downloading book to %s' % bookLocation #Check if the folder location exists if os.path.exists(bookLocation) == False: os.mkdir(bookLocation) # If not create the folder h = httplib.HTTPConnection('webproxy',8080) imageFilePathTemplate = bookLocation + "\\%i.jpg" # Loop through all the pages for the book and save the page for page in range(maxPages): # Create the image file path imageFilePath = imageFilePathTemplate % page; # Check if the file exists if os.path.exists(imageFilePath) == True: write('E%i ' % page) continue url = urltemplate % (isbn,page) h.request('GET', url,headers=headers) write('.') responce = h.getresponse() if responce.status == 401: print 'Not Authorized Book %s, the cookie has expired' % isbn break; data = responce.read() if len(data) < 1000: print 'End of book %s since the page size is too small : %i' % (isbn,len(data)) break f = open(imageFilePath,'wb') f.write(data) f.close() def pdfDirectory(outputPDFName, imageDirectory ): dirim = str(imageDirectory) output = str(outputPDFName) print 'Converting to pdf %s, images %s' % (output,dirim) width, height = A4 height, width = A4 c = canvas.Canvas(output, pagesize=A4) for root, dirs, files in os.walk(dirim): nopage = len(files) for name in range(nopage): #print name/nopage write('.') name = str(name) + ".jpg" filepath = os.path.join(root, name) #if filepath.endswith('20.jpg'): break c.drawImage(filepath, mm * 0.001 , mm * 0.001, height, width, preserveAspectRatio=False) ##c.showPage() c.save() print "PDF of Image directory created %s" % outputPDFName def threadExe(location,isbn): print 'Executing Thread for location %s book %s\n' % (location,isbn) for page in range(maxPages): print '%s Page - %i \n' % (isbn,page) time.sleep(10) def createOptionParser(): parser = OptionParser(usage="Usage: %prog [options]", version="%prog 1.0") parser.add_option("-i", "--isbn", dest="isbn", action='store', type='string') parser.add_option("-d", action="store_true", dest="download", help="Download the book images", default=False) parser.add_option("-c", action="store_true", dest="converToPdf", help="Convert images to pdf file", default=False) parser.add_option("-f", "--imageFolder", type="string", help="Image folder to download or to read from.") parser.add_option("-p", "--pdfOutputFolder", type="string", help="Pdf output folder.") return parser if __name__ == '__main__': parser = createOptionParser() (options, args) = parser.parse_args() if not options.isbn: parser.error("You have to specify the isbn book number") if options.download or options.converToPdf: if not options.imageFolder: parser.error("Specify the image folder") if options.download: downloadBookImages(options.imageFolder,options.isbn) if options.converToPdf: if not options.pdfOutputFolder: parser.error("Specify the pdf folder") print 'Converting to pdf %s, images %s' % (options.pdfOutputFolder,options.imageFolder) pdfDirectory(options.pdfOutputFolder + options.isbn + ".pdf" , options.imageFolder) else: print 'Specify if you would like to download or convert the book or both?' # # for book in books: # downloadBookImages('c:\\tmp',book) # # for book in books: # pdfDirectory('w:\\%s' % book , 'c:\\tmp\\%s.pdf' % book) #
Sunday, February 07, 2010
Extracting the audio from an flv file and creating a new flv with only audio
As a part of my studies I wanted to extract out only the audio from the flv file into a new flv file.
Here is what I did
I also wanted to convert all the files while taking a copy of the original file
The above command didnt exactly work since, it was overwriting the old file as it was being converted, so I used this one
ffmpeg man pages: http://swoolley.org/man.cgi/1/ffmpeg
Here is what I did
$ffmpeg -i input.flv -f flv -vn -acodec copy output.flv
I also wanted to convert all the files while taking a copy of the original file
$find . -name *.flv -exec cp '{}' '{}'.`date +%d.%m.%y`.original \; -exec ffmpeg -i '{}' -y -f flv -vn -acodec copy '{}' \;
The above command didnt exactly work since, it was overwriting the old file as it was being converted, so I used this one
$find . -name *.flv -exec cp '{}' '{}'.original \; -exec ffmpeg -i '{}'.original -y -f flv -vn -acodec copy '{}' \;
ffmpeg man pages: http://swoolley.org/man.cgi/1/ffmpeg
Subscribe to:
Posts (Atom)