Skip to content

Commit

Permalink
feat(scripts): add script to parse prompt books
Browse files Browse the repository at this point in the history
  • Loading branch information
ssube committed Jul 6, 2023
1 parent 1133321 commit de8105e
Showing 1 changed file with 34 additions and 0 deletions.
34 changes: 34 additions & 0 deletions api/scripts/parse-prompts.py
@@ -0,0 +1,34 @@
from typing import List
from argparse import ArgumentParser
from sys import argv
from collections import Counter
from json import dumps


def parse_args(args: List[str]):
    """Parse the command-line arguments of the prompt parser.

    Args:
        args: Argument strings to parse, without the program name.

    Returns:
        The namespace produced by argparse; its ``file`` attribute is a
        list holding the one or more prompt file paths that were given.
    """
    cli = ArgumentParser(
        description="count phrase frequency in prompt books",
        prog="onnx-web prompt parser",
    )
    # nargs="+" requires at least one file and collects them into a list.
    cli.add_argument("file", help="prompt files to parse", nargs="+")
    namespace = cli.parse_args(args)
    return namespace


def main():
    """Count phrase frequency across the prompt files named on the command line.

    Each line of each file is split on commas; every piece is lower-cased
    and stripped of surrounding whitespace. Empty pieces (from blank lines,
    trailing commas or doubled commas) are ignored so they do not show up
    as a bogus "" phrase. The result is printed to stdout as a JSON object
    mapping phrase -> count, ordered from most to least common.
    """
    args = parse_args(argv[1:])

    count = Counter()
    for path in args.file:
        # Decode explicitly as UTF-8 rather than relying on the platform's
        # locale default, which differs between systems.
        with open(path, "r", encoding="utf-8") as f:
            # Stream line by line instead of buffering every file in memory.
            for line in f:
                phrases = (p.lower().strip() for p in line.split(","))
                count.update(p for p in phrases if p)

    # most_common() sorts by descending count; dict() keeps that order.
    print(dumps(dict(count.most_common())))


# Run the parser only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == "__main__":
    main()

0 comments on commit de8105e

Please sign in to comment.