Python:「New Concept English」のテキストファイルを HTML に変換する


詳細
txt2htm.py

# -*- coding: utf-8 -*-
import os, sys
import glob

# txt2htm: convert lesson text files (*.txt) into simple HTML pages (*.htm).
#
# NOTE(review): in the published listing every HTML tag inside the string
# literals had been rendered away (line breaks showed up as bare newlines,
# other tags as nothing).  The output markup below is therefore a
# reconstruction -- confirm it against the original script before relying
# on the exact tags.

# Page prologue; %s receives the input path without its extension.
PAGE_HEAD = """
<html>
<head>
  <meta charset="utf-8">
  <title> %s </title>
</head>
<body>
"""

# Audio player; %s receives the input path without its extension.
# The listing applied "% (fn)" to a template with no placeholder, which
# raises TypeError, so a placeholder is restored here.
# NOTE(review): the ".mp3" extension is an assumption -- confirm.
AUDIO_TAG = """
  <audio src="%s.mp3" controls="controls"></audio>
"""

# A line starting with this prefix is replaced by the audio player.
# NOTE(review): the listing shows a single space here and repeats the very
# same test for one more heading branch and one more stop branch.  As
# published those two repeats can never match, so they are not reproduced;
# the three literals were probably distinct before extraction -- restore
# them if the originals are known.
AUDIO_MARKER = " "

# Lines starting with one of these prefixes are set off as section headings.
SECTION_MARKERS = ("New Word", "New word", "Notes on")

# Conversion stops at the first line starting with one of these prefixes.
STOP_MARKERS = ("document.onclick",)


def convert_lines(lines, name):
    """Return the HTML text generated from the lesson *lines*.

    lines -- iterable of text lines (trailing newlines are kept as-is).
    name  -- string substituted into the page title and the audio source.

    Blank lines are skipped.  The first non-blank line becomes the heading
    after its first space-delimited token is dropped.  Later lines are
    dispatched on their prefix: audio marker, section heading, stop marker,
    or plain text preceded by a line break.  No closing markup is emitted,
    matching the listing, where that final write was commented out.
    """
    parts = [PAGE_HEAD % name]
    audio = AUDIO_TAG % name
    seen = 0
    for line in lines:
        if not line.strip():
            continue
        seen += 1
        if seen == 1:
            # Drop the leading token; a first line without any space used to
            # raise IndexError, so fall back to the whole line in that case.
            title = line.strip().split(' ', 1)[-1]
            parts.append('<br><br>' + title + '<br><br>')
        elif line.startswith(AUDIO_MARKER):
            parts.append(audio)
        elif line.startswith(SECTION_MARKERS):
            parts.append('<br><br><br>' + line)
        elif line.startswith(STOP_MARKERS):
            break
        else:
            parts.append('<br>' + line)
    return ''.join(parts)


def convert_file(src_path, dst_path):
    """Read the text file *src_path* and write its HTML form to *dst_path*."""
    stem = os.path.splitext(src_path)[0]
    # Context managers close both handles even if reading or writing fails.
    with open(src_path, 'r') as src:
        html = convert_lines(src, stem)
    with open(dst_path, 'w') as dst:
        dst.write(html)


def main(argv):
    """Convert every file matching the glob pattern in argv[1].

    Returns the process exit status: 1 for wrong usage, 4 when a matched
    file does not have the '.txt' extension, 0 otherwise.
    """
    if len(argv) != 2:
        # Single-argument print(...) behaves the same on Python 2 and 3.
        print('usage: txt2htm.py *.txt ')
        print('generate ?????.htm ')
        return 1
    for path in glob.glob(argv[1]):
        print(path)
        stem, ext = os.path.splitext(path)
        if ext != '.txt':
            print('Error: %s is not txt file ' % path)
            return 4
        convert_file(path, stem + '.htm')
    return 0


if __name__ == '__main__':
    sys.exit(main(sys.argv))