annotate search/extract_all.py @ 9:d1b54241a731

rewrite meeting fetcher
author drewp@bigasterisk.com
date Wed, 10 Jul 2024 12:25:06 -0700
parents search/search_base.py@f23b21bd0fce
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
f23b21bd0fce apex search
drewp@bigasterisk.com
parents:
diff changeset
1 from typing import Iterable
f23b21bd0fce apex search
drewp@bigasterisk.com
parents:
diff changeset
2
9
d1b54241a731 rewrite meeting fetcher
drewp@bigasterisk.com
parents: 8
diff changeset
3 import extract_agenda
d1b54241a731 rewrite meeting fetcher
drewp@bigasterisk.com
parents: 8
diff changeset
4 import extract_pdf
d1b54241a731 rewrite meeting fetcher
drewp@bigasterisk.com
parents: 8
diff changeset
5 from doc import Doc
8
f23b21bd0fce apex search
drewp@bigasterisk.com
parents:
diff changeset
6
f23b21bd0fce apex search
drewp@bigasterisk.com
parents:
diff changeset
7
f23b21bd0fce apex search
drewp@bigasterisk.com
parents:
diff changeset
def allDocs() -> Iterable[Doc]:
    """Yield everything produced by the enabled extractor modules.

    For each enabled module, every source returned by its ``files()`` is
    handed to that module's ``phrasesFromFile()``, and the results are
    passed through lazily in that order.
    """
    # extract_pdf is imported by this file but currently left out of the run;
    # only extract_agenda is enabled.
    enabled_extractors = (extract_agenda,)
    for extractor in enabled_extractors:
        sources = extractor.files()
        for source in sources:
            yield from extractor.phrasesFromFile(source)