import datetime
import re

from pydantic import ValidationError

from server.backend.api.nomenclature import processing
from server.backend.schemas.pydantic import ExcelInfo, settings, Translit


def report_date(df, date_format: str):
    """Extract the report end date from the first row of the sheet.

    All cells of the first row are joined into one string, which is then
    searched for the word "по" followed by a date written as ``dd.mm.yyyy``.

    Args:
        df: DataFrame holding the raw sheet; only its first row is read.
        date_format: ``strftime`` format used for the returned string.

    Returns:
        The matched date re-formatted with ``date_format``.

    Raises:
        ValueError: If the sheet is empty, the first row contains no
            matching date, or the matched text is not a valid calendar date.
    """
    # An empty frame has no first row; report it the same way as a missing
    # date instead of leaking an IndexError from ``iloc[0]``.
    if df.empty:
        raise ValueError("There is no date in ozon_purchase_handler")

    row_text = " ".join(df.iloc[0].astype(str))
    match = re.search(r"по\s+(\d{2}\.\d{2}\.\d{4})", row_text)
    if not match:
        raise ValueError("There is no date in ozon_purchase_handler")

    dt = datetime.datetime.strptime(match.group(1), "%d.%m.%Y")
    return dt.strftime(date_format)


def process_sheet(df, real_arti: int, real_quantity: int, real_sum_1: int):
    """Normalise, aggregate and validate the rows of a purchase-report sheet.

    Args:
        df: DataFrame holding the raw sheet. The first two rows are skipped.
        real_arti: Positional index of the article column.
        real_quantity: Positional index of the quantity column.
        real_sum_1: Positional index of the sum column.

    Returns:
        A list of ``ExcelInfo`` objects, one per row of the frame returned
        by ``processing``.

    Raises:
        Exception: If at least one row fails ``ExcelInfo`` validation; the
            second argument is a list of ``(row index, error details)``.
    """
    # Skip the first two rows of the sheet.
    df = df.iloc[2:].reset_index(drop=True)

    # Select the required columns BY POSITION and drop incomplete rows.
    df = df.iloc[:, [real_arti, real_quantity, real_sum_1]].copy().dropna()

    # Keep only rows where none of the three values equals zero. The copy
    # makes the column assignments below act on an independent frame.
    df = df[(df != 0).all(axis=1)].copy()

    # Assign the working column names right away.
    df.columns = ['arti', 'counts', 'price']

    # Normalisation: apply the Translit.TRANSLIT replacements, upper-case,
    # then keep only the part of the article matching settings.PATTERN.
    df['arti'] = df['arti'].replace(Translit.TRANSLIT, regex=True)
    # expand=False returns a Series for the single capture group, so a
    # Series (not a one-column DataFrame) is assigned to the column.
    df['arti'] = (
        df['arti']
        .astype(str)
        .str.upper()
        .str.extract(f'({settings.PATTERN})', expand=False)
    )
    df['price'] = df['price'].astype(float)
    df['counts'] = df['counts'].astype(int)

    # Grouping: sum quantities and prices per article.
    df = df.groupby('arti', as_index=False).agg({'counts': 'sum', 'price': 'sum'})

    # vlookup for ref_keys (performed by the project-level helper).
    df = processing(df)

    # Validate every row and collect all failures before raising, so the
    # caller sees the full list of problems at once.
    validated_rows, errors = [], []
    for i, row in df.iterrows():
        try:
            validated_rows.append(ExcelInfo(**row.to_dict()))
        except ValidationError as e:
            errors.append((i, e.errors()))

    if errors:
        raise Exception(
            "There are some errors with validation in Отчет о выкупленных товарах",
            errors
        )
    return validated_rows


def evaluating(dfs):
    """Process the purchased-goods report sheet and extract its date.

    Args:
        dfs: Mapping of sheet name to DataFrame; must contain the key
            "Отчёт о выкупленных товарах".

    Returns:
        A tuple ``(validated_rows, date)``: the result of ``process_sheet``
        and the report date formatted with ``settings.TIMEFORMAT``.
    """
    sheet = dfs["Отчёт о выкупленных товарах"]
    # Column numbers as laid out in the Ozon report.
    validated_rows_1 = process_sheet(
        sheet, real_arti=3, real_quantity=10, real_sum_1=11
    )
    date = report_date(sheet, date_format=settings.TIMEFORMAT)
    return validated_rows_1, date