1
0
Fork 0

feat(scripts): add script to parse prompt books

This commit is contained in:
Sean Sube 2023-07-05 23:05:00 -05:00
parent 1133321179
commit de8105ec60
Signed by: ssube
GPG Key ID: 3EED7B957D362AF1
1 changed files with 34 additions and 0 deletions

View File

@@ -0,0 +1,34 @@
from typing import List
from argparse import ArgumentParser
from sys import argv
from collections import Counter
from json import dumps
def parse_args(args: List[str]):
    """Parse the command-line arguments of the prompt parser.

    Args:
        args: Argument strings, without the program name.

    Returns:
        The argparse namespace; its ``file`` attribute is the list of one
        or more prompt file paths given on the command line.
    """
    cli = ArgumentParser(
        description="count phrase frequency in prompt books",
        prog="onnx-web prompt parser",
    )
    # nargs="+" requires at least one path and always yields a list.
    cli.add_argument("file", help="prompt files to parse", nargs="+")
    namespace = cli.parse_args(args)
    return namespace
def main():
    """Count comma-separated phrases across prompt files and print them as JSON.

    Reads every file named on the command line, splits each line on commas,
    normalizes each phrase (lower-cased, surrounding whitespace stripped) and
    prints a JSON object mapping phrase to occurrence count, ordered from most
    to least frequent.

    Raises:
        OSError: If one of the files cannot be opened.
        UnicodeDecodeError: If a file is not valid UTF-8.
    """
    args = parse_args(argv[1:])

    count = Counter()
    for file in args.file:
        # Decode explicitly so the result does not depend on the platform's
        # default locale encoding.
        with open(file, "r", encoding="utf-8") as f:
            # Stream line by line instead of loading every file into memory.
            for line in f:
                phrases = (p.lower().strip() for p in line.split(","))
                # Blank lines, trailing commas and doubled commas all produce
                # empty strings; they are not phrases, so do not count them.
                count.update(p for p in phrases if p)

    # most_common() sorts by descending count; dict() keeps that order in the
    # JSON output.
    print(dumps(dict(count.most_common())))
# Run the parser only when executed as a script, not when imported.
if __name__ == "__main__":
    main()