python:「新概念英語」(New Concept English)のテキストをHTMLに変換する
詳細
txt2htm.py
txt2htm.py
# -*- coding: utf-8 -*-
import os, sys
import glob
# Lines starting with one of these prefixes are section headings in the input.
# NOTE(review): as the script reads now, heading lines are written exactly
# like ordinary body lines ('\n' + line). The literals look as if they once
# carried markup that has since been lost -- confirm against the original.
_HEADING_PREFIXES = ("New Word", "New word", "Notes on")

# Conversion of a file stops at the first line starting with this prefix.
_STOP_PREFIX = "document.onclick"


def _render(stem, lines):
    """Yield the output chunks for one input file, in the order they are written.

    stem  -- input path without its extension; written as the headline.
    lines -- iterable of raw input lines (trailing newlines kept).

    Blank / whitespace-only lines are skipped and do not count as the
    first line.
    """
    yield '\n%s\n' % stem

    # NOTE(review): this used to be built as `"""\n""" % (fn)`. That template
    # has no placeholder, so the expression raised TypeError ("not all
    # arguments converted") for every file. The template presumably held
    # markup referencing the file stem; only the text that is still visible
    # is emitted here.
    audio = '\n'

    seen = 0
    for line in lines:
        if not line.strip():
            continue
        seen += 1
        if seen == 1:
            # Title line: drop the first space-separated token and keep the
            # rest. [-1] (instead of [1]) keeps the whole line when there is
            # no space at all, rather than raising IndexError.
            yield line.strip().split(' ', 1)[-1] + '\n'
        elif line.startswith(' '):
            # NOTE(review): two further branches tested this same " " prefix
            # (one wrote '\n' + line, one stopped the loop). Both were
            # unreachable behind this test and were dropped; their real
            # prefixes were presumably different -- restore if known.
            yield audio
        elif line.startswith(_HEADING_PREFIXES):
            yield '\n' + line
        elif line.startswith(_STOP_PREFIX):
            break
        else:
            yield '\n' + line

    yield '\n'


def convert_file(src_path):
    """Convert one text file into a sibling file with the .htm extension.

    The output path is src_path with its extension replaced by '.htm'.
    Both files are closed even if reading or writing fails.

    Returns the path of the file that was written.
    """
    stem = os.path.splitext(src_path)[0]
    dst_path = stem + '.htm'
    with open(src_path, 'r') as src, open(dst_path, 'w') as dst:
        dst.writelines(_render(stem, src))
    return dst_path


def main(argv=None):
    """Command-line entry point: txt2htm.py PATTERN

    PATTERN is a glob pattern. Every match is printed and converted.
    Exits with status 1 on wrong usage, and with status 4 as soon as a
    matched file does not have the .txt extension (files matched before
    it have already been converted).
    """
    if argv is None:
        argv = sys.argv
    if len(argv) != 2:
        print('usage: txt2htm.py *.txt ')
        print('generate ?????.htm ')
        sys.exit(1)

    for src_path in glob.glob(argv[1]):
        print(src_path)
        if os.path.splitext(src_path)[1] != '.txt':
            print('Error: %s is not txt file ' % src_path)
            sys.exit(4)
        convert_file(src_path)


if __name__ == '__main__':
    main()