Skip to content

Commit

Permalink
feat: batch size as env variable and return metadata
Browse files (browse the repository at this point in the history)
  • Loading branch information
tim-schultz committed Aug 14, 2024
1 parent 9f689e0 commit 46de20c
Show file tree
Hide file tree
Showing 4 changed files with 13 additions and 6 deletions.
6 changes: 3 additions & 3 deletions api/passport/api.py
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ class ScoreModel(Schema):

class DetailedScoreModel(Schema):
score: int
n_transactions: Optional[int]
num_transactions: Optional[int]
first_funder: Optional[str]
first_funder_amount: Optional[int]

Expand Down Expand Up @@ -103,7 +103,7 @@ async def fetch(session, url, data):
"data": {
"human_probability": -1,
"n_transactions": -1,
"error": "Error fetching model response",
"error": str(e),
}
}

Expand Down Expand Up @@ -185,7 +185,7 @@ async def handle_get_analysis(

ret.details.models[model] = DetailedScoreModel(
score=score,
n_transactions=num_transactions,
num_transactions=num_transactions,
first_funder=first_funder,
first_funder_amount=first_funder_amount,
)
Expand Down
2 changes: 1 addition & 1 deletion api/passport/test/test_analysis.py
Original file line number Diff line number Diff line change
Expand Up @@ -194,7 +194,7 @@ def test_handle_get_analysis_returns_additional_data(self, mock_fetch):
)

assert analysis.details.models["zksync"].score == 95
assert analysis.details.models["zksync"].n_transactions == 10
assert analysis.details.models["zksync"].num_transactions == 10
assert analysis.details.models["zksync"].first_funder == "funder"
assert analysis.details.models["zksync"].first_funder_amount == 1000

Expand Down
10 changes: 8 additions & 2 deletions (file path not captured in this extract)
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@
from registry.admin import get_s3_client
from registry.models import BatchModelScoringRequest, BatchRequestStatus
from scorer.settings import (
BULK_MODEL_SCORE_BATCH_SIZE,
BULK_MODEL_SCORE_REQUESTS_RESULTS_FOLDER,
BULK_SCORE_REQUESTS_ADDRESS_LIST_FOLDER,
BULK_SCORE_REQUESTS_BUCKET_NAME,
Expand Down Expand Up @@ -99,7 +100,7 @@ def download_from_s3(self, s3_filename):
except Exception as e:
raise CommandError(f"Failed to download file from S3: {str(e)}")

def process_csv_in_batches(self, csv_data, batch_size=300):
def process_csv_in_batches(self, csv_data, batch_size=BULK_MODEL_SCORE_BATCH_SIZE):
while True:
batch = list(islice(csv_data, batch_size))
if not batch:
Expand Down Expand Up @@ -137,7 +138,12 @@ async def process_address(self, address, model_list):

details_dict = {
"models": {
model: {"score": score.score}
model: {
"score": score.score,
"num_transactions": score.num_transactions,
"first_funder": score.first_funder,
"first_funder_amount": score.first_funder_amount,
}
for model, score in analysis.details.models.items()
}
}
Expand Down
1 change: 1 addition & 0 deletions api/scorer/settings/base.py
Original file line number Diff line number Diff line change
Expand Up @@ -463,6 +463,7 @@
BULK_MODEL_SCORE_REQUESTS_RESULTS_FOLDER = env(
    "BULK_MODEL_SCORE_REQUESTS_RESULTS_FOLDER", default="model-score-results"
)
# Number of CSV rows handled per batch by the bulk model-scoring command.
# Coerced to int explicitly: the value is used as the stop argument of
# itertools.islice, which only accepts integers, and a value supplied through
# the environment may come back from env() as a string rather than a number.
BULK_MODEL_SCORE_BATCH_SIZE = int(env("BULK_MODEL_SCORE_BATCH_SIZE", default=50))
DATA_SCIENCE_API_KEY = env("DATA_SCIENCE_API_KEY", default="abc")

VERIFIER_URL = env("VERIFIER_URL", default="http://localhost:8001/verifier/verify")

0 comments on commit 46de20c

Please sign in to comment.