Skip to content

Commit

Permalink
notebooks
Browse files Browse the repository at this point in the history
  • Loading branch information
semio committed Sep 16, 2024
1 parent eea145b commit 88e0059
Showing 1 changed file with 40 additions and 0 deletions.
40 changes: 40 additions & 0 deletions automation-api/yival_experiments/notebooks/compare_evaluators.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,40 @@
import duckdb
import polars as pl


# Notebook-style script: find rows where the evaluators disagree, export them
# for manual review, and report what share of the rows they represent.
# Bare expressions below only display a value when run interactively.

# Load the results table (path is relative to the current working directory).
results = pl.read_parquet("../output/results.parquet")

# Interactive inspection of the available column names.
results.columns

# Keep only the rows whose model_id contains "llama".
df = results.filter(pl.col("model_id").str.contains("llama"))


# Connection with no database path, i.e. nothing is persisted by DuckDB itself.
conn = duckdb.connect()


# DuckDB resolves the table name `df` to the Python variable of the same name,
# so the polars frame can be queried directly. Interactive preview only.
conn.query("select * from df")

# Select rows with a non-zero simple_evaluator_matching for which it is NOT
# true that all of these hold: llama3 == vertex_ai, gpt4 == vertex_ai and
# simple_evaluator_matching == gpt4.
# NOTE(review): if any of the compared columns is NULL the predicate evaluates
# to NULL and the row is dropped from `diffs` - confirm that is intended.
# NOTE(review): the inner `simple_evaluator_matching <> 0` is redundant with
# the outer one; kept so the query text stays unchanged.
q = """select
*
from
df
where
not (
llama3_evaluator_correctness = vertex_ai_evaluator_correctness
and gpt4_evaluator_correctness = vertex_ai_evaluator_correctness
and (
simple_evaluator_matching <> 0
and simple_evaluator_matching = gpt4_evaluator_correctness
)
)
and simple_evaluator_matching <> 0"""

# Lazy relation; it is executed when counted or exported below.
diffs = conn.query(q)

# Fetch the actual counts instead of only displaying them, so the ratio at the
# end is derived from the data rather than from pasted numbers.
n_total = conn.query("select count(*) from df").fetchone()[0]
n_diffs = conn.query("select count(*) from diffs").fetchone()[0]

# Export the disagreeing rows for manual checking.
diffs.to_csv("to_check.csv")

# Share of the filtered rows that need checking. The original hard-coded
# `1281 / 30780` (presumably these two counts from an earlier run), which goes
# stale whenever the parquet file changes. Guard against an empty selection.
n_diffs / n_total if n_total else 0.0

0 comments on commit 88e0059

Please sign in to comment.