Skip to content

Commit

Permalink
Issue #2: added a lookup for the keywords field in PDF metadata
Browse files: browse the repository at this point in the history
  • Loading branch information
Tyler Danstrom committed Jul 6, 2017
1 parent 7c97a1c commit 8ab8568
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions bin/extractor.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,11 +28,11 @@ def main():
total_files = 0

with open(args.output_file, "w", encoding="utf-8") as csv_file:
csvfieldnames = ["title", "author", "creationDate", "subject", "filePath"]
csvfieldnames = ["title", "author", "creationDate", "subject", "keywords", "filePath"]
writer = csv.DictWriter(csv_file, fieldnames=csvfieldnames)
writer.writeheader()
for n_file in a_generator:
parsed = Parser(n_file, ['author', 'subject', 'title', 'creationDate'])
parsed = Parser(n_file, ['author', 'subject', 'keywords', 'title', 'creationDate'])
total_files += 1
info = parsed.get_metadata()
info["filePath"] = basename(n_file)
Expand Down

0 comments on commit 8ab8568

Please sign in to comment.