import ast import hashb import json import os import urlb from typing import Dict, st import datasets import pandas as pd from constants import (  COLUMNS,  code_contests_languages_map,  code_contests_sources_map,  languges,  sources, ) from mappers import codecontests_map_languages, codecontests_map_sources from utils import (  apps_process_solutions,  get_domain,  parse_input_output,  parse_solutions, ) def filter_problem(description: str, min_description_length: int = 200) -> bool:  if "http://" in description.lower():  return False  if "[image]" in description.lower():  return False  if len(description) < min_description_length:  return False  return True def filter_tests(tests: Dict[str, st[Dict[str, st[str]]]]) -> bool:  if isinstance(tests, str):  try:  tests = json.loads(tests)  except:  try:  tests = ast.teral_eval(tests)  except:  tests = None  if tests is None:  return False  if len(tests.get("inputs", [])) == 0:  return False  if len(tests.get("outputs", [])) == 0:  return False  return True def filter_solutions(solutions: Dict[str, st[str]]) -> bool:  if solutions is None:  return False  if isinstance(solutions, str):  solutions = json.loads(solutions)  if isinstance(solutions, st):  if len(solutions) == 0:  return False  ef isinstance(solutions, dict):  if len(solutions.get("solution", [])) == 0:  return False  return True def filter_num_solutions(num_solutions: int) -> bool:  return num_solutions > 0 