Spaces:
Sleeping
Sleeping
import gradio as gr | |
import re | |
import inspect | |
import numpy as np | |
import pandas as pd | |
import os | |
from datetime import datetime | |
from sentence_transformers import SentenceTransformer | |
from sentence_transformers.util import cos_sim | |
from sentence_transformers import CrossEncoder | |
# import mysql.connector | |
import psycopg2 | |
db_user = os.environ["DB_NAME"] | |
# mydb = mysql.connector.connect( | |
# host=os.environ["DB_HOST"], | |
# user=os.environ["DB_USER"], | |
# port=os.environ["DB_PORT"], | |
# password=os.environ["DB_PASSWORD"] | |
# ) | |
mydb = psycopg2.connect( | |
host=os.environ["DB_HOST"], | |
user=os.environ["DB_USER"], | |
port=os.environ["DB_PORT"], | |
database=os.environ["DB_NAME"], | |
password=os.environ["DB_PASSWORD"] | |
) | |
# df_sample = pd.read_sql(f"SELECT * FROM {db_user}.sample", mydb) | |
# df_bobot = pd.read_sql(f"SELECT * FROM {db_user}.bobot", mydb) | |
df_sample = pd.read_sql(f"SELECT * FROM sample", mydb) | |
df_bobot = pd.read_sql(f"SELECT * FROM bobot", mydb) | |
df_bobot['BOBOT'] = [float(x.replace(",",".")) for x in df_bobot['BOBOT']]#.astype(float) | |
df_bobot["JENIS_KENDARAAN"] = [x[:-2] + x[-1] if x[-2] == "." else x for x in df_bobot["JENIS_KENDARAAN"]] | |
dict_swdkllj = { | |
"A":3000, | |
"B":23000, | |
"C1":35000, | |
"C2":83000, | |
"DP":35000, | |
"DU":73000, | |
"EP":153000, | |
"EU":90000, | |
"F":163000 | |
} | |
def find_swdkllj(row): | |
cc = int(row["jumlah_cc"]) | |
nm = str(row["nm_jenis_kb"]).upper() | |
if nm in ["AMBULANCE", "DAMKAR", "MOBIL JENAZAH"]: | |
return "A" | |
if nm in ["ALAT BERAT"]: | |
return "B" | |
if nm in ["SEDAN", "JEEP", "MINIBUS"]: | |
return "DP" | |
if "SPD. MOTOR" in nm: | |
if cc <= 50: | |
return "A" | |
elif cc <= 250: | |
return "C1" | |
else: | |
return "C2" | |
if "PICK UP" in nm: | |
if cc <= 2400: | |
return "DP" | |
df_sample["gol"] = df_sample.apply(find_swdkllj, axis=1) | |
df_sample["pnbp_stnk"] = df_sample["nm_jenis_kb"].apply( | |
lambda x: 100000 if x == "SPD. MOTOR R2" else 200000 | |
) | |
df_sample["pnbp_tnkb"] = df_sample["nm_jenis_kb"].apply( | |
lambda x: 60000 if x == "SPD. MOTOR R2" else 100000 | |
) | |
codes = """001 - Vehicle Registration (New) | |
002 - Vehicle Registration Renewal | |
003 - Vehicle Ownership Transfer | |
004 - Vehicle De-registration | |
005 - Lost Registration Certificate Replacement | |
006 - Address Change Update | |
007 - Vehicle Data Correction | |
008 - Ownership Name Correction | |
009 - Vehicle Tax Payment | |
010 - Late Payment Fee Processing | |
011 - Vehicle Type/Specification Update | |
012 - BBNKB (Transfer Fee of Vehicle Ownership) | |
013 - STNK Issuance (Vehicle Registration Certificate) | |
014 - STNK Renewal | |
015 - Motor Vehicle Roadworthiness Inspection | |
016 - Plate Number Renewal | |
017 - Lost Plate Replacement | |
018 - Vehicle Export Registration | |
019 - Vehicle Import Registration | |
020 - Fleet Vehicle Registration | |
021 - Bulk Vehicle Registration Update | |
022 - Vehicle Insurance Assistance | |
023 - Vehicle Accident Reporting | |
024 - Vehicle Usage Change Declaration (e.g., personal to commercial) | |
025 - Legal Document Verification | |
026 - Ownership Transfer for Inherited Vehicle | |
027 - STNK Temporary Suspension | |
028 - Proof of Ownership Document Update | |
029 - Vehicle Ownership History Check | |
030 - Vehicle Tax Recalculation Request | |
031 - Tax Exemption Application (for special cases) | |
032 - Deceased Owner’s Vehicle Ownership Transfer""".split("\n") | |
undetected = "099 - Other/Undetected" | |
# codes = """001 - Pendaftaran Kendaraan (Baru) | |
# 002 - Pembaruan Pendaftaran Kendaraan | |
# 003 - Alih Kepemilikan Kendaraan | |
# 004 - Pembatalan Pendaftaran Kendaraan | |
# 005 - Penggantian Sertifikat Pendaftaran Kendaraan yang Hilang | |
# 006 - Pembaruan Perubahan Alamat | |
# 007 - Koreksi Data Kendaraan | |
# 008 - Koreksi Nama Kepemilikan | |
# 009 - Pembayaran Pajak Kendaraan | |
# 010 - Proses Denda Keterlambatan Pembayaran | |
# 011 - Pembaruan Jenis/Spesifikasi Kendaraan | |
# 012 - Pembayaran Pajak Kendaraan Melalui E-Samsat | |
# 013 - Penerbitan STNK (Sertifikat Pendaftaran Kendaraan) | |
# 014 - Pembaruan STNK | |
# 015 - Pemeriksaan Kelayakan Jalan Kendaraan Bermotor | |
# 016 - Pembaruan Nomor Plat Kendaraan | |
# 017 - Penggantian Plat yang Hilang | |
# 018 - Pendaftaran Ekspor Kendaraan | |
# 019 - Pendaftaran Impor Kendaraan | |
# 020 - Pendaftaran Kendaraan Armada | |
# 021 - Pembaruan Pendaftaran Kendaraan Massal | |
# 022 - Bantuan Asuransi Kendaraan | |
# 023 - Pelaporan Kecelakaan Kendaraan | |
# 024 - Deklarasi Perubahan Penggunaan Kendaraan (misalnya, pribadi ke komersial) | |
# 025 - Verifikasi Dokumen Hukum | |
# 026 - Alih Kepemilikan Kendaraan Warisan | |
# 027 - Penangguhan Sementara STNK | |
# 028 - Pembaruan Dokumen Bukti Kepemilikan | |
# 029 - Pemeriksaan Riwayat Kepemilikan Kendaraan | |
# 030 - Permintaan Perhitungan Ulang Pajak Kendaraan | |
# 031 - Permohonan Pembebasan Pajak (untuk kasus khusus) | |
# 032 - Alih Kepemilikan Kendaraan Pemilik yang Meninggal""".split("\n") | |
codes = """001 - Pendaftaran Kendaraan | |
002 - Pembaruan Data Kendaraan | |
003 - Alih Kepemilikan atau Balik Nama Kendaraan | |
004 - Pelaporan Dokumen atau Plat yang Hilang | |
005 - Pembayaran dan Pengelolaan Pajak Kendaraan | |
006 - Pemeriksaan dan Verifikasi Kendaraan | |
007 - Pendaftaran Kendaraan Ekspor, Impor, atau Armada | |
008 - Pelaporan dan Bantuan Terkait Kendaraan | |
009 - Penangguhan atau Deklarasi Perubahan Penggunaan Kendaraan""".split("\n") | |
codes = """003 - Alih Kepemilikan atau Balik Nama Kendaraan | |
005 - Pembayaran dan Pengelolaan Pajak Kendaraan""".split("\n") | |
# documents = """Vehicle Registration | |
# Vehicle Data Update | |
# Vehicle Ownership or Change of Name | |
# Reporting of Lost Documents or Plates | |
# Vehicle Tax Payment and Management | |
# Vehicle Inspection and Verification | |
# Registration of Export, Import, or Fleet Vehicles | |
# Reporting and Assistence of Vehicles Insurance | |
# Suspension or Declaration of Change of Vehicle Use""".split("\n") | |
# examples = [ | |
# {"code": "001", "examples": [ | |
# "Register a new vehicle", | |
# "Vehicle registration application", | |
# "Apply for vehicle registration", | |
# "Submit new vehicle registration", | |
# "New vehicle registration request" | |
# ]}, | |
# {"code": "002", "examples": [ | |
# "Update vehicle information", | |
# "Change details of a registered vehicle", | |
# "Submit updated vehicle data", | |
# "Request vehicle data update", | |
# "Modify vehicle registration information" | |
# ]}, | |
# {"code": "003", "examples": [ | |
# "Transfer vehicle ownership", | |
# "Apply for vehicle name change", | |
# "Request ownership transfer for a vehicle", | |
# "Submit vehicle ownership change", | |
# "Process vehicle title transfer" | |
# ]}, | |
# {"code": "004", "examples": [ | |
# "Report lost vehicle documents (STNK, BPKB, etc)", | |
# "Declare missing license plates", | |
# "File a report for lost vehicle papers", | |
# "Lost vehicle documents reporting", | |
# "Inform authorities about missing vehicle documents" | |
# ]}, | |
# {"code": "005", "examples": [ | |
# "Pay vehicle tax", | |
# "Manage vehicle tax payments", | |
# "Submit vehicle tax payment", | |
# "Request vehicle tax management services", | |
# "Complete annual vehicle tax" | |
# ]}, | |
# {"code": "006", "examples": [ | |
# "Conduct vehicle inspection", | |
# "Request vehicle verification check", | |
# "Submit vehicle for verification", | |
# "Schedule vehicle examination", | |
# "Apply for vehicle inspection and verification" | |
# ]}, | |
# {"code": "007", "examples": [ | |
# "Register an imported vehicle", | |
# "Submit registration for export vehicle", | |
# "Apply for fleet vehicle registration", | |
# "Register new vehicle for export or import", | |
# "Fleet vehicle registration application" | |
# ]}, | |
# {"code": "008", "examples": [ | |
# "Report vehicle-related issues", | |
# "Request assistance for a vehicle problem", | |
# "Submit report concerning a vehicle", | |
# "File for vehicle-related support", | |
# "Seek help with vehicle concerns" | |
# ]}, | |
# {"code": "009", "examples": [ | |
# "Suspend vehicle usage", | |
# "Declare change of vehicle usage purpose", | |
# "Request a hold on vehicle usage", | |
# "Submit application for vehicle usage change", | |
# "File for suspension of vehicle operations" | |
# ]} | |
# ] | |
examples = [ | |
{"code": "001", "examples": [ | |
"Daftarkan kendaraan baru", | |
"Pengajuan pendaftaran kendaraan", | |
"Ajukan pendaftaran kendaraan", | |
"Serahkan pendaftaran kendaraan baru", | |
"Permintaan pendaftaran kendaraan baru" | |
]}, | |
{"code": "002", "examples": [ | |
"Perbarui informasi kendaraan", | |
"Ubah detail kendaraan yang terdaftar", | |
"Ajukan pembaruan data kendaraan", | |
"Permintaan pembaruan data kendaraan", | |
"Modifikasi informasi pendaftaran kendaraan" | |
]}, | |
{"code": "003", "examples": [ | |
"Alihkan kepemilikan kendaraan", | |
"Ajukan perubahan nama kendaraan", | |
"Permintaan pengalihan kepemilikan kendaraan", | |
"Serahkan perubahan kepemilikan kendaraan", | |
"Proses alih nama kendaraan" | |
]}, | |
{"code": "004", "examples": [ | |
"Laporkan dokumen kendaraan hilang (STNK, BPKB, dll)", | |
"Nyatakan plat nomor hilang", | |
"Ajukan laporan dokumen kendaraan hilang", | |
"Pelaporan dokumen kendaraan yang hilang", | |
"Informasikan pihak berwenang tentang dokumen kendaraan yang hilang" | |
]}, | |
{"code": "005", "examples": [ | |
"Bayar pajak kendaraan", | |
"Kelola pembayaran pajak kendaraan", | |
"Ajukan pembayaran pajak kendaraan", | |
"Permintaan layanan manajemen pajak kendaraan", | |
"Selesaikan pajak tahunan kendaraan" | |
]}, | |
{"code": "006", "examples": [ | |
"Lakukan pemeriksaan kendaraan", | |
"Ajukan pemeriksaan verifikasi kendaraan", | |
"Serahkan kendaraan untuk verifikasi", | |
"Jadwalkan pemeriksaan kendaraan", | |
"Ajukan inspeksi dan verifikasi kendaraan" | |
]}, | |
{"code": "007", "examples": [ | |
"Daftarkan kendaraan impor", | |
"Ajukan pendaftaran kendaraan ekspor", | |
"Ajukan pendaftaran kendaraan armada", | |
"Daftarkan kendaraan baru untuk ekspor atau impor", | |
"Pengajuan pendaftaran kendaraan armada" | |
]}, | |
{"code": "008", "examples": [ | |
"Laporkan masalah terkait kendaraan", | |
"Permintaan bantuan untuk masalah kendaraan", | |
"Ajukan laporan mengenai kendaraan", | |
"Ajukan dukungan terkait kendaraan", | |
"Cari bantuan terkait permasalahan kendaraan" | |
]}, | |
{"code": "009", "examples": [ | |
"Tangguhkan penggunaan kendaraan", | |
"Nyatakan perubahan tujuan penggunaan kendaraan", | |
"Ajukan penangguhan penggunaan kendaraan", | |
"Ajukan perubahan penggunaan kendaraan", | |
"Ajukan penangguhan operasional kendaraan" | |
]} | |
] | |
# examples = [ | |
# {"code": "001", "examples": [ | |
# codes[0][6:], | |
# "Pendaftaran kendaraan", | |
# "Daftar baru untuk plat kendaraan", | |
# "Registrasi kendaraan" | |
# ]}, | |
# {"code": "002", "examples": [ | |
# codes[1][6:], | |
# "Perubahan alamat, warna, komponnen kendaraan", | |
# "Update informasi kendaraan", | |
# "Perubahan data pemilik", | |
# ]}, | |
# {"code": "003", "examples": [ | |
# codes[2][6:], | |
# "Alih kepemilikan kendaraan", | |
# "Balik nama untuk kendaraan", | |
# "Perubahan pemilik pada kendaraan" | |
# ]}, | |
# {"code": "004", "examples": [ | |
# codes[3][6:], | |
# "Laporan kehilangan dokumen kendaraan", | |
# "Hilangnya plat nomor kendaraan", | |
# "Dokumen kendaraan dilaporkan hilang" | |
# ]}, | |
# {"code": "005", "examples": [ | |
# codes[4][6:], | |
# "Pembayaran pajak kendaraan", | |
# "Kelola pajak tahunan kendaraan", | |
# "Pajak kendaraan" | |
# ]}, | |
# {"code": "006", "examples": [ | |
# codes[5][6:], | |
# "Pemeriksaan fisik kendaraan", | |
# "Verifikasi kendaraan", | |
# "Cek kondisi kendaraan" | |
# ]}, | |
# {"code": "007", "examples": [ | |
# codes[6][6:], | |
# "Pendaftaran kendaraan impor", | |
# "Registrasi armada baru", | |
# "Kendaraan ekspor didaftarkan" | |
# ]}, | |
# {"code": "008", "examples": [ | |
# codes[7][6:], | |
# "Pelaporan terkait kendaraan", | |
# "Bantuan atau Asuransi atas kendaraan", | |
# "Laporkan masalah kendaraan" | |
# ]}, | |
# {"code": "009", "examples": [ | |
# codes[8][6:], | |
# "Penangguhan penggunaan kendaraan", | |
# "Deklarasi perubahan fungsi kendaraan", | |
# "Penggunaan baru untuk kendaraan" | |
# ]} | |
# ] | |
vehicle_tax_info = { | |
"B 1234 BCA": { | |
"no_rangka": "1237191234", | |
"type": "SUV", | |
"tanggal": "23 Desember 2024", | |
"status": "Belum Bayar", | |
"harga_jual": 500_000_000 # In Rupiah | |
}, | |
"B 5678 XYZ": { | |
"no_rangka": "9876543210", | |
"type": "Sedan", | |
"tanggal": "15 Januari 2025", | |
"status": "Belum Bayar", | |
"harga_jual": 375_800_000 # In Rupiah | |
}, | |
"D 3456 DEF": { | |
"no_rangka": "4561237890", | |
"type": "MPV", | |
"tanggal": "10 Februari 2025", | |
"status": "Sudah Bayar", | |
"harga_jual": 400_000_000 # In Rupiah | |
} | |
} | |
# Table for detail calculations (perhitungan) | |
detail_perhitungan = { | |
"001": { | |
"name": "Pendaftaran Kendaraan", | |
"formula": lambda harga_jual: harga_jual * 0.1, | |
# Example formula: 10% of harga_jual | |
}, | |
"002": { | |
"name": "Pembaruan Data Kendaraan", | |
"formula": lambda harga_jual: harga_jual * 0.05, | |
# Example formula: 5% of harga_jual | |
}, | |
"003": { | |
"name": "Alih Kepemilikan (Balik Nama) Kendaraan", | |
"formula": lambda harga_jual: harga_jual * 0.1, | |
# Example formula: 10% of harga_jual | |
}, | |
"004": { | |
"name": "Penggantian Dokumen atau Plat yang Hilang", | |
"formula": lambda harga_jual: harga_jual * 0.03, | |
# Example formula: 3% of harga_jual | |
}, | |
"005": { | |
"name": "Pembayaran dan Pengelolaan Pajak Kendaraan", | |
"formula": lambda harga_jual: harga_jual * 0.12, | |
# Example formula: 12% of harga_jual | |
}, | |
"006": { | |
"name": "Pemeriksaan dan Verifikasi Kendaraan", | |
"formula": lambda harga_jual: 100000, | |
# Example formula: 2% of harga_jual | |
}, | |
"007": { | |
"name": "Pendaftaran Kendaraan Ekspor, Impor, atau Armada", | |
"formula": lambda harga_jual: harga_jual * 0.15, | |
# Example formula: 15% of harga_jual | |
}, | |
"008": { | |
"name": "Pelaporan dan Bantuan Terkait Kendaraan", | |
"formula": lambda harga_jual: harga_jual * 0.04, | |
# Example formula: 4% of harga_jual | |
}, | |
"009": { | |
"name": "Penangguhan atau Deklarasi Perubahan Penggunaan Kendaraan", | |
"formula": lambda harga_jual: harga_jual * 0.06, | |
# Example formula: 6% of harga_jual | |
} | |
} | |
undetected = "099 - Lainnya/Tidak Terdeteksi" | |
model_ids = [ | |
"BAAI/bge-m3", | |
"sentence-transformers/paraphrase-multilingual-mpnet-base-v2", | |
"intfloat/multilingual-e5-small", | |
"sentence-transformers/distiluse-base-multilingual-cased-v2", | |
"Alibaba-NLP/gte-multilingual-base", | |
"sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2", | |
"jinaai/jina-reranker-v2-base-multilingual", | |
"BAAI/bge-reranker-v2-m3", | |
] | |
# model_id = "sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2" | |
# model_id = "Alibaba-NLP/gte-multilingual-base" | |
# model_id = "BAAI/bge-m3" | |
# model_id = "sentence-transformers/paraphrase-multilingual-mpnet-base-v2" | |
# model_id = "intfloat/multilingual-e5-small" | |
# model_id = "sentence-transformers/distiluse-base-multilingual-cased-v2" | |
model_id = model_ids[-1] | |
model = None | |
codes_emb = None | |
def load_model(model_id): | |
# global model | |
# global codes_emb | |
if model_id in model_ids[-2:]: | |
model = CrossEncoder( | |
# "jinaai/jina-reranker-v2-base-multilingual", | |
# "BAAI/bge-reranker-v2-m3", | |
model_id, | |
automodel_args={"torch_dtype": "auto"}, | |
trust_remote_code=True, | |
) | |
return model, None | |
else: | |
model = SentenceTransformer(model_id, trust_remote_code=True) | |
codes_emb = model.encode([x[6:] for x in codes]) | |
# codes_emb = model.encode([x["examples"] for x in examples])#.mean(axis=1) | |
# codes_emb = np.mean([model.encode(x["examples"]) for x in examples], axis=1) | |
return model, codes_emb | |
model, codes_emb = load_model(model_id) | |
# for x in examples: | |
# codes_emb.append(model.encode(x["examples"])) | |
# codes_emb = np.mean(codes_emb, axis=1) | |
def censor_middle(number, num_to_hide=4): | |
number_str = str(number) | |
if num_to_hide == -1: | |
num_to_hide = int(len(number_str)*0.8) | |
middle_index = len(number_str) // 2 | |
start_index = middle_index - num_to_hide // 2 | |
end_index = middle_index + num_to_hide // 2 | |
censored_part = "\*" * num_to_hide | |
censored_number = number_str[:start_index] + censored_part + number_str[end_index:] | |
return censored_number | |
def get_calculation(request_code, plate_number): | |
print(request_code, plate_number, "GET CALC") | |
calc = detail_perhitungan.get(request_code) | |
vehicle = vehicle_tax_info.get(plate_number) | |
if vehicle != None and calc != None: | |
harga_jual = vehicle.get("harga_jual") | |
formula = calc.get("formula") | |
result = formula(harga_jual) | |
description = inspect.getsource(formula).split(":", 2)[-1].strip() | |
result_detail = request_code + " - " + calc.get("name") | |
return result, str(description), result_detail | |
elif calc != None: | |
formula = calc.get("formula") | |
description = inspect.getsource(formula).split(":", 2)[-1].strip() | |
result_detail = request_code + " - " + calc.get("name") | |
return None, str(description), result_detail | |
else: | |
return None, None, None | |
def build_output_formula(descriptions, result_details): | |
out = "----------------------------------------------------\n\n" | |
out = "Daftar Kode Permohonan:\n" | |
for i, (desc,detail) in enumerate(zip(descriptions, result_details)): | |
# harga_jual = str(vehicle.get("harga_jual")) | |
out += f"{i+1}. {detail}\nRumus: {desc}\n" | |
return out | |
def build_output_vehicle(plate_number): | |
vehicle = vehicle_tax_info.get(plate_number).copy() | |
out = "----------------------------------------------------\n\n" | |
out = "Nomor Polisi: " + plate_number + "\n" | |
vehicle["no_rangka"] = censor_middle(vehicle["no_rangka"]) | |
vehicle["harga_jual"] = "Rp{:,}".format(vehicle["harga_jual"]) | |
out += "\n".join([k + " : " + str(v) for k,v in vehicle.items()]) | |
return out | |
def build_output(result, description, result_detail, plate_number): | |
return build_outputs([result], [description], [result_detail], plate_number) | |
def build_outputs(results, descriptions, result_details, plate_number): | |
vehicle = vehicle_tax_info.get(plate_number).copy() | |
vehicle["harga_jual"] = "Rp{:,}".format(vehicle["harga_jual"]) | |
out = "----------------------------------------------------\n\n" | |
out = "Nomor Polisi: " + plate_number + "\n" | |
out += "\n".join([k + " : " + str(v) if k != "no_rangka" else k + " : " + censor_middle(v) for k,v in vehicle.items()]) | |
# out += "\n----------------------------------------------" | |
# out += f"\nWajib Pajak dengan NoPol {plate_number} ingin melakukan proses berikut:\n" | |
out += "\n\nDaftar Kode Permohonan:\n" | |
for i, (res,desc,detail) in enumerate(zip(results, descriptions, result_details)): | |
harga_jual = vehicle["harga_jual"] | |
res_str = "{:,}".format(res) | |
out += f"{i+1}. {detail}\nRumus: {desc}\nDetail perhitungan: {desc.replace('harga_jual', harga_jual)} = Rp{res_str}\n" | |
# out += "----------------------------\nEstimasi biaya: " | |
out += "\n\n\nEstimasi Biaya: " | |
if len(results) > 1: | |
out += " + ".join(["Rp{:,}".format(x) for x in results]) | |
out += " = Rp{:,}".format(sum(results)) | |
else: | |
out += "Rp{:,}".format(results[0]) | |
out += "\n\n----------------------------" | |
# out += "\n----------------------------\n\n--------------------------------" | |
return out | |
def respond( | |
message, | |
history: list[tuple[str, str]], | |
threshold, | |
is_multiple, | |
n_num, | |
): | |
global codes_emb | |
global undetected | |
undetected_code = undetected[:3] | |
# if history and history[-1][-1][21:24] == undetected_code: | |
# list_his = "" | |
# for his in history[::-1]: | |
# if his[-1][21:24] != undetected_code: | |
# break | |
# list_his = his[0] + "\n" + list_his | |
# message += "\n" + list_his | |
# pattern = r'\b([A-Z]{1,2})\s?(\d{4})\s?([A-Z]{3})\b' | |
# pattern = r'\b([A-Z]{1,2})\s?(\d{4})\s?([A-Z]{1,3})\b' | |
pattern = r'\b([A-Za-z]{1,2})\s?(\d{4})\s?([A-Za-z]{1,3})\b' | |
matches = re.findall(pattern, message) | |
plates = [" ".join(x).upper() for i,x in enumerate(matches)] | |
plate_numbers = ", ".join(plates) | |
# if model.config._name_or_path in model_ids[-2:]: | |
if type(model) == CrossEncoder: | |
# documents = [v["name"] for v in detail_perhitungan.values()] | |
sentence_pairs = [[message, v["name"]] for v in detail_perhitungan.values()] | |
# sentence_pairs = [[message, doc] for doc in documents] | |
scores = model.predict(sentence_pairs, convert_to_tensor=True) | |
weights = [1,1,1,1,1,1,1,1,1] | |
# scores = [x["score"] for x in model.rank(message, documents)] | |
else: | |
text_emb = model.encode(message) | |
scores = cos_sim(codes_emb, text_emb).mean(axis=-1)#[:,0] | |
weights = [19,8,7,6,5,4,3,2,1] | |
scores_argsort = scores.argsort(descending=True) | |
# if n_num == 0: | |
# std = scores.std() | |
# else: | |
# std = 0 | |
if n_num == 0: | |
# w_avg = np.average(scores[scores_argsort].numpy(), weights=range(len(scores),0,-1)) | |
w_avg = np.average(scores[scores_argsort].numpy(), weights=weights) | |
else: | |
w_avg = 9999 | |
#[::-1] | |
if is_multiple: | |
request_details = [] | |
request_numbers = [] | |
request_scores = [] | |
# request_undetected = False | |
# for i,score in enumerate(scores): | |
if scores[scores_argsort[0]] < threshold: | |
request_details.append(undetected[6:]) | |
request_numbers.append(undetected_code) | |
else: | |
for i in scores_argsort: | |
# if scores[scores_argsort[0]] - std <= scores[i]: | |
if scores[i] > w_avg: | |
request_details.append(codes[i][6:]) | |
request_numbers.append(codes[i][:3]) | |
request_scores.append(str( round(scores[i].tolist(), 3) ) ) | |
else: | |
if len(request_scores) >= n_num: | |
break | |
if scores[i] > threshold: | |
request_details.append(codes[i][6:]) | |
request_numbers.append(codes[i][:3]) | |
request_scores.append(str( round(scores[i].tolist(), 3) ) ) | |
request_numbers_copy = request_numbers | |
request_details_copy = request_details | |
request_numbers = "\n".join(request_numbers) | |
request_details = "\n".join(request_details) | |
request_scores = "\n".join(request_scores) | |
# if len(request_numbers_copy) > 0: | |
# for code, detail in zip(request_numbers_copy, request_details_copy): | |
# kode_mohon = detail_perhitungan.get(code) | |
# formula = kode_mohon.get("formula") | |
# description = inspect.getsource(formula).split(":", 2)[-1].strip() | |
# if request_undetected and len(plates) == 0: | |
# + f"\n\nConfidence score:\n{request_scores}" | |
# return "Request code number:\n" + request_numbers + "\n\nRequest detail:\n" + request_details + "\n\nPlate numbers: " + plate_numbers | |
print(request_scores) | |
out = "" | |
for plate in plates: | |
results, descriptions, result_details = [], [], [] | |
for code in request_numbers_copy: | |
result, description, result_detail = get_calculation(code, plate) | |
if result != None: | |
results.append(result) | |
if descriptions != None: | |
descriptions.append(description) | |
result_details.append(result_detail) | |
if results: | |
out += "\n\n" + build_outputs(results, descriptions, result_details, plate) | |
elif vehicle_tax_info.get(plate): | |
out += "\n\n" + build_output_vehicle(plate) | |
if out == "": | |
descriptions, result_details = [], [] | |
for code in request_numbers_copy: | |
result, description, result_detail = get_calculation(code, "") | |
if description != None: | |
descriptions.append(description) | |
result_details.append(result_detail) | |
if descriptions: | |
out += "\n\n" + build_output_formula(descriptions, result_details) | |
else: | |
return "Request code number: " + request_numbers + "\nRequest detail: " + request_details + "\nPlate numbers: " + plate_numbers | |
return out | |
# result, description, result_detailget_calculation(request_code, plate_number) | |
s_max = scores.argmax() | |
if scores[s_max] < threshold: | |
# request_code = "033 - Other/Undetected" | |
request_code = undetected | |
else: | |
request_code = codes[scores.argmax()] | |
# "{:.2f}".format(a) | |
# out = "Request code number: " + request_code[:3] + "\nRequest detail: " + request_code[6:] + f"\nConfidence score: {round(scores[s_max].tolist(),3)}" + "\nPlate numbers: " + plate_numbers | |
out = "" | |
for plate in plates: | |
results, descriptions, result_details = [], [], [] | |
result, description, result_detail = get_calculation(request_code[:3], plate) | |
if result != None: | |
results.append(result) | |
descriptions.append(description) | |
result_details.append(result_detail) | |
out += "\n\n" + build_outputs(results, descriptions, result_details, plate) | |
elif vehicle_tax_info.get(plate): | |
out += "\n\n" + build_output_vehicle(plate) | |
elif description != None: | |
descriptions.append(description) | |
result_details.append(result_detail) | |
out += "\n\n" + build_output_formula(descriptions, result_details) | |
# else: | |
# # + f"\nConfidence score: {round(scores[s_max].tolist(),3)}" | |
# out += "Request code number: " + request_code[:3] + "\nRequest detail: " + "\nPlate numbers: " + plate_numbers | |
if out == "": | |
if request_code[:3] == undetected_code: | |
return "Request code number: " + request_code[:3] + "\nRequest detail: " + request_code[6:] + "\nPlate numbers: " + plate_numbers | |
else: | |
result, description, result_detail = get_calculation(request_code[:3], "") | |
out += build_output_formula([description], [result_detail]) | |
return out | |
# if vehicle_tax_info.get(request_detail) | |
# for val in history: | |
# if val[0]: | |
# messages.append({"role": "user", "content": val[0]}) | |
# if val[1]: | |
# messages.append({"role": "assistant", "content": val[1]}) | |
# messages.append({"role": "user", "content": message}) | |
# response = "" | |
# for message in client.chat_completion( | |
# messages, | |
# max_tokens=max_tokens, | |
# stream=True, | |
# temperature=temperature, | |
# top_p=top_p, | |
# ): | |
# token = message.choices[0].delta.content | |
# response += token | |
# yield response | |
""" | |
For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface | |
""" | |
# demo = gr.ChatInterface( | |
# respond, | |
# ) | |
def reload(chosen_model_id): | |
global model | |
global model_id | |
global codes_emb | |
if chosen_model_id != model_id: | |
model, codes_emb = load_model(chosen_model_id) | |
# model = SentenceTransformer(chosen_model_id, trust_remote_code=True) | |
# model_id = chosen_model_id | |
# codes_emb = model.encode([x[6:] for x in codes]) | |
# codes_emb = model.encode([x["examples"] for x in examples])#.mean(axis=1) | |
# codes_emb = np.mean([model.encode(x["examples"]) for x in examples], axis=1) | |
return f"Model {chosen_model_id} has been succesfully loaded!" | |
return f"Model {chosen_model_id} is ready!" | |
def respond_pkb( | |
message, | |
history: list[tuple[str, str]], | |
threshold, | |
tarif_pkb, | |
tarif_bbnkb, | |
): | |
global codes_emb | |
global undetected | |
undetected_code = undetected[:3] | |
# tarif_pkb = 1.5/100 | |
# tarif_bbnkb = 0.1 | |
pattern = r'\b([A-Za-z]{1,2})\s?(\d{2,4})\s?([A-Za-z]{1,3})\b' | |
matches = re.findall(pattern, message) | |
plates = [" ".join(x).upper() for i,x in enumerate(matches)] | |
if type(model) == CrossEncoder: | |
sentence_pairs = [[message, v[6:]] for v in codes] | |
scores = model.predict(sentence_pairs, convert_to_tensor=True) | |
weights = [9,8] | |
else: | |
text_emb = model.encode(message) | |
scores = cos_sim(codes_emb, text_emb).mean(axis=-1)#[:,0] | |
weights = [11,9] | |
scores_argsort = scores.argsort(descending=True) | |
w_avg = np.average(scores[scores_argsort].numpy(), weights=weights) | |
out = "" | |
for inp in plates: | |
vehicle = df_sample[df_sample["no_polisi"] == inp.strip()].copy() | |
if vehicle.shape[0] == 0: | |
out += f"\n\n---\nKendaraan {inp} Tidak Ditemukan\n" | |
else: | |
vehicle["nm_pemilik"] = censor_middle(vehicle["nm_pemilik"].values[0], -1) | |
vehicle["al_pemilik"] = censor_middle(vehicle["al_pemilik"].values[0], -1) | |
v_type = vehicle["nm_jenis_kb"].values[0] | |
nilai_jual = vehicle["nilai_jual"].values[0] | |
pnbp_stnk = vehicle["pnbp_stnk"].values[0] | |
pnbp_tnkb = vehicle["pnbp_tnkb"].values[0] | |
bobot = df_bobot[df_bobot["JENIS_KENDARAAN"]==v_type]["BOBOT"].values[0] | |
bbnkb = tarif_bbnkb * nilai_jual * 1 # pengenaan | |
pkb = tarif_pkb * bobot * nilai_jual * 1 # pengenaan | |
vehicle["nilai_jual"] = f"Rp{int(nilai_jual):,}" | |
out += "\n\n---\nDetail Kendaraan:" | |
for k,v in vehicle.iloc[0].items(): | |
out += f"\n{k} \t\t: {v}" | |
# out += "\n==================================================================" | |
out += "\n--" | |
if scores[scores_argsort[0]] < threshold: | |
continue | |
header_rincian = "| POKOK | DENDA | TOTAL ||\n|-:|-:|-:|:-|\n" | |
rincian = "\n\n### RINCIAN:\n\n" + header_rincian | |
is_rincian = False | |
out_k = "" | |
if scores[0] > w_avg: | |
out += f"\nBBNKB \t\t: {int(bbnkb):,}" | |
out_k += "\nRumus Bea Balik Nama Kendaraan Bermotor (BBNKB) : TARIF x NJKB x PENGENAAN" | |
out_k += f"\nKalkulasi : {tarif_bbnkb*100}% x Rp{int(nilai_jual):,} x 100%" | |
out_k += f"\nTotal Pembayaran : Rp{int(bbnkb):,}\n" | |
rincian += f"|{int(bbnkb):,}|0|{int(bbnkb):,}|BBNKB|\n" | |
is_rincian = True | |
else: | |
bbnkb = 0 | |
if scores[1] > w_avg: | |
d = datetime.now().date() - vehicle["tg_akhir_pkb"].values[0] | |
d = d.days // 365 | |
if d < 1: | |
d = 1 | |
# swdkllj = 35000 | |
swdkllj = dict_swdkllj.get(vehicle["gol"].values[0]) | |
out += f"\nPKB \t\t: {int(pkb*d):,}" | |
out += f"\nSWDKLLJ \t\t: {int(swdkllj*d):,}" | |
out += f"\nPNBP STNK \t\t:{int(pnbp_stnk):,}" | |
out += f"\nPNBP TNKB \t\t:{int(pnbp_tnkb):,}" | |
out += f"\nTOTAL \t\t: {int(pkb*d + swdkllj*d + pnbp_stnk + pnbp_tnkb + bbnkb):,}" | |
out_k += "\nRumus Pokok Pajak Kendaraan Bermotor (PKB) : TARIF * NJKB * BOBOT * PENGENAAN * TAHUN BAYAR" | |
out_k += f"\nKalkulasi : {tarif_pkb*100}% * Rp{int(nilai_jual):,} * {bobot} * 100% * {d}" | |
out_k += f"\nTotal Pembayaran : Rp{int(pkb*d):,}\n" | |
out_k += "\nRumus Total PKB: PKB + SWDKLLJ + PNBP STNK + PNBP TNKB" | |
out_k += f"\nKalkulasi : Rp{int(pkb*d):,} + Rp{int(swdkllj*d):,} + Rp{int(pnbp_stnk):,} + Rp{int(pnbp_tnkb):,}" | |
out_k += f"\nTotal Pembayaran : Rp{int(pkb*d + swdkllj*d + pnbp_stnk + pnbp_tnkb):,}\n" | |
rincian += f"|{int(pkb*d):,}|0|{int(pkb*d):,}|PKB|\n" + f"|{int(swdkllj*d):,}|0|{int(swdkllj*d):,}|SWDKLLJ|\n\n" | |
rincian_pkb = "### RINCIAN PKB:\n\n| POKOK | DENDA | TOTAL |\n|-:|-:|-:|\n" | |
rincian_swdkllj = "### RINCIAN SWDKLLJ:\n\n| POKOK | DENDA | TOTAL |\n|-:|-:|-:|\n" | |
for i in range(d): | |
rincian_pkb += f"|{int(pkb):,}|0|{int(pkb):,}|PKB|\n" | |
rincian_swdkllj += f"|{int(swdkllj):,}|0|{int(swdkllj):,}|PKB|\n" | |
rincian += rincian_pkb + "\n" + rincian_swdkllj | |
is_rincian = True | |
out += out_k | |
if is_rincian: | |
out += rincian | |
if not out and scores[scores_argsort[0]] >= threshold: | |
if scores[0] > w_avg: | |
out += "\nRumus Bea Balik Nama Kendaraan Bermotor (BBNKB) : TARIF x NJKB x PENGENAAN" | |
if scores[1] > w_avg: | |
out += "\nRumus Pokok Pajak Kendaraan Bermotor (PKB) : TARIF * NJKB * BOBOT * PENGENAAN" | |
return out | |
with gr.Blocks() as demo: | |
# Add header title and description | |
gr.Markdown("# List of Request Numbers") | |
gr.Markdown("<br>".join(codes) + "<br>" + undetected) | |
gr.Markdown("# Valid License Plate Number Criteria:") | |
gr.Markdown("(1-2 letters) (4 numbers) (1-3 letters)") | |
# gr.Markdown("# Example Valid Plate Numbers") | |
# gr.Markdown("<br>".join(vehicle_tax_info.keys())) | |
gr.Markdown("# Example Valid Plate Numbers") | |
gr.Dataframe(df_sample.drop_duplicates(['nm_jenis_kb'])) | |
gr.Markdown("# Choose & Load Model:") | |
reload_model = gr.Interface( | |
fn=reload, | |
inputs=[gr.Dropdown(choices=model_ids, value=model_id)], | |
outputs="text", | |
# gr.HighlightedText( | |
# label="status", | |
# combine_adjacent=True, | |
# show_legend=True, | |
# color_map={"+": "red", "-": "green"} | |
# ), | |
) | |
gr.Markdown("# Chatbot Interface:") | |
chat_interface = gr.ChatInterface( | |
respond_pkb, | |
chatbot=gr.Chatbot(height=670),#800 | |
additional_inputs=[ | |
gr.Number(0.0005, label="confidence threshold", show_label=True, minimum=0., maximum=1.0, step=0.1), | |
gr.Number(0.015, label="tarif pajak kendaraan bermotor (pkb)", show_label=True, minimum=0., maximum=1.0, step=0.01), | |
gr.Number(0.1, label="tarif bea balik nama kendaraan bermotor (bbnkb)", show_label=True, minimum=0., maximum=1.0, step=0.05), | |
# gr.Checkbox(True, label="multiple", info="Allow multiple request code numbers"), | |
# gr.Number(3, label="maximum number of request codes", show_label=True, minimum=0, step=1, precision=0) | |
], | |
# # type="messages", | |
# # textbox=gr.Textbox(placeholder="Ask me a yes or no question", container=False, scale=7), | |
# # title="SamSat Virtual Assistant", | |
# # description="Ask Yes Man any question", | |
# # theme="soft", | |
# # examples=["balik nama D 3456 DEF", "bayar pajak B 1234 BCA", "halo, selamat pagi!"], | |
# # cache_examples=True, | |
) | |
if __name__ == "__main__": | |
demo.launch() | |