Skip to content

Commit

Permalink
Minor fixes
Browse files (browse the repository at this point in the history)
  • Loading branch information
kstathou committed Dec 5, 2023
1 parent 5751859 commit 2c88fb9
Showing 1 changed file with 2 additions and 4 deletions.
6 changes: 2 additions & 4 deletions src/llm_stack/scripts/build_dataset_ner.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,6 @@
# Imports shared across functions
with image.run_inside():
import asyncio
- import logging
import os

import pandas as pd
Expand Down Expand Up @@ -98,7 +97,6 @@ async def annotate_dataset_with_open_ai(
messages = [
system_message.to_prompt(),
user_message.to_prompt(text=tup.abstract),
- # formatting_message,
]
tasks.append(
openai_llm.generate(
Expand Down Expand Up @@ -146,8 +144,8 @@ async def main(
local_data_path_ner_openai: str = "preprints_openai_ner.parquet",
) -> None:
"""Build an NER dataset using arXiv's papers and OpenAI's LLMs."""
- logging.info("Fetching arXiv data...")
+ # Fetching the arXiv data
fetch_arxiv_data.remote(local_data_path=local_data_path_raw)

- logging.info("NER with OpenAI...")
+ # NER with OpenAI
annotate_dataset_with_open_ai.remote(local_data_path=local_data_path_ner_openai)

0 comments on commit 2c88fb9

Please sign in to comment.