def _flush_record(record):
    """Analyze one buffered record and save it if analysis yields a tuple.

    An empty buffer is ignored. Any exception raised by ``analyzer`` or
    ``savemail`` propagates to the caller unchanged.
    """
    if record == '':
        return
    arr = analyzer(record)
    # Only tuple results are saved; any other return value is skipped.
    if isinstance(arr, tuple):
        # NOTE(review): index 3 is deliberately not passed here, as in the
        # original code -- confirm against savemail's signature.
        savemail(arr[0], arr[1], arr[2], arr[4], arr[5])


# A new record starts on a line that begins with three integer fields
# separated by '||' (e.g. "12||345||6...").
p = re.compile(r'^[0-9]+\|\|[0-9]+\|\|[0-9]+')
buf = ''
i = 0  # not used in this snippet; kept in case later code reads it

# The context manager guarantees the file is closed even if analysis fails.
with open('./work.txt', 'r') as f:
    for v in f:
        m = p.match(v)
        if m:
            # A header line closes the previous record: process what has
            # been accumulated so far, then start a new buffer with this line.
            _flush_record(buf)
            buf = v
            continue
        # Continuation line: append it to the record being accumulated.
        buf += v

# The final record has no following header line to trigger a flush, so it
# must be processed explicitly once the input is exhausted.
_flush_record(buf)
극히 단순한 형태의 자료처리...
자발적고난 (부제: 눈뜬쉑이들의 세상!!!)
요즘 다시 Lucene을 가지고 놀고 있어요..
오래전에 작업한 내용이라서 처음부터 다시 보려니 약간의 짜증이...
>>> import PyLucene
>>> dir(PyLucene.IndexReader)
['__class__', '__del__', '__delattr__', '__dict__', '__doc__', '__getattr__', '__getattribute__', '__hash__', '__init__', '__module__', '__new__', '__reduce__', '__reduce_ex__', '__repr__', '__setattr__', '__str__', '__swig_getmethods__', '__swig_setmethods__', '__weakref__', '_s', 'close', 'deleteTerm', 'docFreq', 'document', 'getCurrentVersion', 'hasDeletions', 'indexExists', 'isDeleted', 'isLocked', 'lastModified', 'maxDoc', 'numDocs', 'open', 'setNorm', 'termDocs', 'termPositions', 'terms', 'undeleteAll', 'unlock']
>>> directory = PyLucene.FSDirectory_getDirectory('doc-pylucene-indx',False)
>>> reader = PyLucene.IndexReader.open(directory)
>>> reader.numDocs()
499
>>> reader.deleteTerm(400)
>>> reader.numDocs()
498
>>> reader.isDeleted(400
... )
True
>>> reader.close()
>>> reader = PyLucene.IndexReader.open(directory)
>>> reader.numDocs()
498
>>>
Geek’s Blog is powered by Tattertools.com / Original WP theme by John Wrana / tattertools skin by yuno
