Test first batch matches (#53)

Summary:

Test Plan:
This commit is contained in:
Pedro Rodriguez 2025-02-13 10:05:08 -08:00 committed by GitHub
parent 9d907fed1c
commit 85c2f28f26
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
4 changed files with 53 additions and 0 deletions

View file

@@ -25,6 +25,7 @@ def test_entropy_model():
row_num=0,
arrow_batch_size=100,
s3_profile=None,
file_format="arrow",
)
arrow_file = initial_state.build()
tokenizer_args = TokenizerArgs(