| PASS |
CRITICAL |
__table__ |
row_count |
Table should have >= 23000000 rows |
1 |
1 |
0 |
100.00% |
|
| PASS |
WARNING |
person |
not_null |
person should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
CRITICAL |
record_id |
not_null |
record_id should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| ERROR |
INFO |
reg_addr_koatuu |
text_null |
reg_addr_koatuu should not contain text representations of NULL |
- |
- |
- |
- |
Flight returned internal error, with message: Error while expanding view nessie.mvs.reestrtz. Failed to execute POST request against 'http://nessie:19120/api/v2/trees/main%40919c71db00429064a3236801ea7239e9146841bbb2883b5298095536669970dd/contents'.
View SQL SELECT
record_id,
person,
reg_addr_koatuu,
r.oper_code,
UPPER(o.oper_name) AS oper_name,
o."condition" AS oper_car_condition,
o.short AS short_oper_name,
o.description AS oper_description,
o.notes AS oper_notes,
o.owner_change,
o.is_import,
o.is_aid,
o.is_credit_leasing,
o.modification_type,
o.document_basis,
o.entity_type,
o.is_wartime,
o.is_digital,
o.is_stolen_related,
o.is_insurer,
o.is_social,
d_reg,
r.dep_code,
d.dep,
d.region AS dep_region,
d.city AS dep_city,
d.address AS dep_address,
d.address_number AS dep_address_number,
d.description AS dep_description,
d.hours_of_work AS dep_hours_of_work,
d.phones AS dep_phones,
brand_lat AS brand,
model_lat AS model,
autodata_generations AS generation,
model_suffix,
make_year,
vin_model_year AS model_year,
vin_year_code,
INITCAP(color) AS color,
kind,
body,
autodata_possible_body_types AS possible_body_types,
body_subtype,
body_modifiers,
vehicle_class,
trailer_prefix,
INITCAP(purpose) AS purpose,
main_fuel AS fuel,
secondary_fuel,
is_gbo,
is_hybrid,
fuel_notes,
autodata_possible_fuels AS possible_fuels,
capacity,
autodata_possible_displacements AS possible_displacements,
own_weight,
total_weight,
payload,
n_reg_cleaned AS n_reg_new_cyrillic,
n_reg_latin,
has_old_cyrillic,
plate_type,
region_code,
is_valid_plate,
validation_error,
INITCAP(region_name_final) AS region_name,
needs_moderation,
raw_vin,
vin_latin AS vin,
is_valid_vin,
vin_validation_error,
vin_length,
vin_is_17,
vin_has_ioq,
vin_wmi,
vin_wmi_manufacturer,
vin_wmi_region,
vin_wmi_known,
autodata_possible_transmissions AS possible_transmissions,
autodata_possible_drives AS possible_drives,
backfill_confidence,
backfill_stage
FROM "nessie"."mvs"."raw_reestrtz" at branch main AS r
LEFT JOIN "nessie"."mvs"."dim"."oper_codes" AS o ON o.oper_code = r.oper_code
LEFT JOIN "nessie"."mvs"."dim"."dep" AS d ON d.dep_code = r.dep_code
SQL Query
SELECT /*+ no_reflections */
COUNT(*) AS total,
SUM(CASE WHEN UPPER(CAST("reg_addr_koatuu" AS VARCHAR)) IN ('NULL', 'NONE', 'N/A', 'NA', 'NAN', '-', '#N/A', '#NULL!')
OR CAST("reg_addr_koatuu" AS VARCHAR) = ''
THEN 1 ELSE 0 END) AS failed
FROM nessie.mvs.reestrtz AT BRANCH "main"
WHERE "reg_addr_koatuu" IS NOT NULL
|
| PASS |
WARNING |
person |
text_null |
person should not contain text representations of NULL |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
reg_addr_koatuu |
null_distribution |
reg_addr_koatuu: 611393 null (2.5%), 23841590 not null (97.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
person |
allowed_values |
person should be in allowed set |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
CRITICAL |
record_id |
text_null |
record_id should not contain text representations of NULL |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
reg_addr_koatuu |
distinct_count |
reg_addr_koatuu: 28715 distinct values |
23841590 |
23841590 |
0 |
100.00% |
|
| INFO |
INFO |
oper_code |
null_distribution |
oper_code: 78 null (0.0%), 24452905 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
oper_code |
distinct_count |
oper_code: 187 distinct values |
24452905 |
24452905 |
0 |
100.00% |
|
| INFO |
INFO |
oper_car_condition |
null_distribution |
oper_car_condition: 6999915 null (28.6%), 17453068 not null (71.4%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
oper_car_condition |
text_null |
oper_car_condition should not contain text representations of NULL |
17453068 |
17453068 |
0 |
100.00% |
|
| INFO |
INFO |
oper_name |
distinct_count |
oper_name: 180 distinct values |
24450909 |
24450909 |
0 |
100.00% |
|
| INFO |
INFO |
oper_name |
null_distribution |
oper_name: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
short_oper_name |
null_distribution |
short_oper_name: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
oper_car_condition |
allowed_values |
oper_car_condition should be in allowed set |
17453068 |
17453068 |
0 |
100.00% |
|
| PASS |
INFO |
short_oper_name |
text_null |
short_oper_name should not contain text representations of NULL |
24450909 |
24450909 |
0 |
100.00% |
|
| INFO |
INFO |
oper_description |
null_distribution |
oper_description: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
short_oper_name |
distinct_count |
short_oper_name: 5 distinct values |
24450909 |
24450909 |
0 |
100.00% |
|
| PASS |
INFO |
oper_description |
text_null |
oper_description should not contain text representations of NULL |
24450909 |
24450909 |
0 |
100.00% |
|
| INFO |
INFO |
oper_notes |
null_distribution |
oper_notes: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
owner_change |
null_distribution |
owner_change: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
oper_notes |
text_null |
oper_notes should not contain text representations of NULL |
24450909 |
24450909 |
0 |
100.00% |
|
| INFO |
INFO |
is_aid |
null_distribution |
is_aid: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
is_credit_leasing |
null_distribution |
is_credit_leasing: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
modification_type |
null_distribution |
modification_type: 23099378 null (94.5%), 1353605 not null (5.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
is_import |
null_distribution |
is_import: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
modification_type |
text_null |
modification_type should not contain text representations of NULL |
1353605 |
1353605 |
0 |
100.00% |
|
| PASS |
INFO |
modification_type |
allowed_values |
modification_type should be in allowed set |
1353605 |
1353605 |
0 |
100.00% |
|
| INFO |
INFO |
entity_type |
null_distribution |
entity_type: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
document_basis |
null_distribution |
document_basis: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
entity_type |
text_null |
entity_type should not contain text representations of NULL |
24450909 |
24450909 |
0 |
100.00% |
|
| PASS |
INFO |
document_basis |
text_null |
document_basis should not contain text representations of NULL |
24450909 |
24450909 |
0 |
100.00% |
|
| PASS |
INFO |
entity_type |
allowed_values |
entity_type should be in allowed set |
24450909 |
24450909 |
0 |
100.00% |
|
| INFO |
INFO |
is_stolen_related |
null_distribution |
is_stolen_related: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
is_wartime |
null_distribution |
is_wartime: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
is_digital |
null_distribution |
is_digital: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
is_insurer |
null_distribution |
is_insurer: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
is_social |
null_distribution |
is_social: 2074 null (0.0%), 24450909 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
d_reg |
not_null |
d_reg should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
d_reg |
date_range |
d_reg should be between 2010-01-01 and today |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
dep_code |
not_null |
dep_code should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
d_reg |
distinct_count |
d_reg: 4658 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
dep_code |
text_null |
dep_code should not contain text representations of NULL |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
dep_code |
distinct_count |
dep_code: 665 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
dep |
null_distribution |
dep: 1 null (0.0%), 24452982 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
dep_code |
regex |
dep_code should match ^\d+$ |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
dep |
distinct_count |
dep: 498 distinct values |
24452982 |
24452982 |
0 |
100.00% |
|
| PASS |
INFO |
dep |
text_null |
dep should not contain text representations of NULL |
24452982 |
24452982 |
0 |
100.00% |
|
| INFO |
INFO |
dep_region |
null_distribution |
dep_region: 1 null (0.0%), 24452982 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
dep_region |
text_null |
dep_region should not contain text representations of NULL |
24452982 |
24452982 |
0 |
100.00% |
|
| INFO |
INFO |
dep_region |
distinct_count |
dep_region: 25 distinct values |
24452982 |
24452982 |
0 |
100.00% |
|
| INFO |
INFO |
dep_city |
null_distribution |
dep_city: 5432997 null (22.2%), 19019986 not null (77.8%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
dep_city |
text_null |
dep_city should not contain text representations of NULL |
19019986 |
19019986 |
0 |
100.00% |
|
| INFO |
INFO |
dep_city |
distinct_count |
dep_city: 144 distinct values |
19019986 |
19019986 |
0 |
100.00% |
|
| INFO |
INFO |
dep_address |
null_distribution |
dep_address: 5432997 null (22.2%), 19019986 not null (77.8%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
dep_address |
text_null |
dep_address should not contain text representations of NULL |
19019986 |
19019986 |
0 |
100.00% |
|
| PASS |
INFO |
oper_name |
text_null |
oper_name should not contain text representations of NULL |
24450909 |
24450909 |
0 |
100.00% |
|
| PASS |
INFO |
dep_address_number |
text_null |
dep_address_number should not contain text representations of NULL |
18880457 |
18880457 |
0 |
100.00% |
|
| INFO |
INFO |
dep_address_number |
null_distribution |
dep_address_number: 5572526 null (22.8%), 18880457 not null (77.2%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
dep_description |
null_distribution |
dep_description: 23721422 null (97.0%), 731561 not null (3.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
dep_description |
text_null |
dep_description should not contain text representations of NULL |
731561 |
731561 |
0 |
100.00% |
|
| INFO |
INFO |
dep_hours_of_work |
null_distribution |
dep_hours_of_work: 5433478 null (22.2%), 19019505 not null (77.8%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
dep_hours_of_work |
text_null |
dep_hours_of_work should not contain text representations of NULL |
19019505 |
19019505 |
0 |
100.00% |
|
| INFO |
INFO |
dep_phones |
null_distribution |
dep_phones: 6323464 null (25.9%), 18129519 not null (74.1%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
dep_phones |
text_null |
dep_phones should not contain text representations of NULL |
18129519 |
18129519 |
0 |
100.00% |
|
| INFO |
INFO |
brand |
null_distribution |
brand: 2270 null (0.0%), 24450713 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
model |
null_distribution |
model: 8344 null (0.0%), 24444639 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
brand |
distinct_count |
brand: 4289 distinct values |
24450713 |
24450713 |
0 |
100.00% |
|
| FAIL |
WARNING |
brand |
text_null |
brand should not contain text representations of NULL |
24450713 |
24450710 |
3 |
100.00% |
|
| INFO |
INFO |
model |
distinct_count |
model: 35521 distinct values |
24444639 |
24444639 |
0 |
100.00% |
|
| PASS |
WARNING |
model |
text_null |
model should not contain text representations of NULL |
24444639 |
24444639 |
0 |
100.00% |
|
| INFO |
INFO |
model_suffix |
null_distribution |
model_suffix: 18959675 null (77.5%), 5493308 not null (22.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| FAIL |
INFO |
model_suffix |
text_null |
model_suffix should not contain text representations of NULL |
5493308 |
5493014 |
294 |
99.99% |
|
| INFO |
INFO |
generation |
array_length |
generation: avg array len=2.4, min=0, max=12 |
17942491 |
17942491 |
0 |
100.00% |
|
| FAIL |
INFO |
generation |
array_empty |
generation should not contain empty arrays |
17942491 |
16832475 |
1110016 |
93.81% |
|
| INFO |
INFO |
model_suffix |
distinct_count |
model_suffix: 9460 distinct values |
5493308 |
5493308 |
0 |
100.00% |
|
| INFO |
INFO |
make_year |
distinct_count |
make_year: 108 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
make_year |
not_null |
make_year should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
model_year |
null_distribution |
model_year: 9160598 null (37.5%), 15292385 not null (62.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
make_year |
range |
make_year should be in range [1900, 2027] |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
model_year |
distinct_count |
model_year: 60 distinct values |
15292385 |
15292385 |
0 |
100.00% |
|
| FAIL |
INFO |
model_year |
range |
model_year should be in range [1900, 2027] |
15292385 |
15138467 |
153918 |
98.99% |
|
| INFO |
INFO |
vin_year_code |
null_distribution |
vin_year_code: 6682681 null (27.3%), 17770302 not null (72.7%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
vin_year_code |
distinct_count |
vin_year_code: 35 distinct values |
17770302 |
17770302 |
0 |
100.00% |
|
| PASS |
INFO |
vin_year_code |
text_null |
vin_year_code should not contain text representations of NULL |
17770302 |
17770302 |
0 |
100.00% |
|
| PASS |
WARNING |
color |
not_null |
color should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
color |
distinct_count |
color: 14 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
kind |
not_null |
kind should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
generation |
text_null_array |
generation array should not contain text representations of NULL |
17942491 |
17942491 |
0 |
100.00% |
|
| INFO |
INFO |
body |
null_distribution |
body: 14441 null (0.1%), 24438542 not null (99.9%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
kind |
distinct_count |
kind: 14 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
color |
text_null |
color should not contain text representations of NULL |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
WARNING |
kind |
text_null |
kind should not contain text representations of NULL |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
body |
distinct_count |
body: 75 distinct values |
24438542 |
24438542 |
0 |
100.00% |
|
| INFO |
INFO |
possible_body_types |
array_length |
possible_body_types: avg array len=1.7, min=1, max=6 |
17942491 |
17942491 |
0 |
100.00% |
|
| PASS |
INFO |
body |
text_null |
body should not contain text representations of NULL |
24438542 |
24438542 |
0 |
100.00% |
|
| PASS |
INFO |
possible_body_types |
array_empty |
possible_body_types should not contain empty arrays |
17942491 |
17942491 |
0 |
100.00% |
|
| INFO |
INFO |
body_subtype |
null_distribution |
body_subtype: 23095097 null (94.4%), 1357886 not null (5.6%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
body_subtype |
distinct_count |
body_subtype: 36 distinct values |
1357886 |
1357886 |
0 |
100.00% |
|
| PASS |
INFO |
body_subtype |
text_null |
body_subtype should not contain text representations of NULL |
1357886 |
1357886 |
0 |
100.00% |
|
| PASS |
INFO |
body_modifiers |
text_null |
body_modifiers should not contain text representations of NULL |
808817 |
808817 |
0 |
100.00% |
|
| INFO |
INFO |
body_modifiers |
distinct_count |
body_modifiers: 12 distinct values |
808817 |
808817 |
0 |
100.00% |
|
| INFO |
INFO |
vehicle_class |
null_distribution |
vehicle_class: 11946373 null (48.9%), 12506610 not null (51.1%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
body_modifiers |
null_distribution |
body_modifiers: 23644166 null (96.7%), 808817 not null (3.3%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
vehicle_class |
text_null |
vehicle_class should not contain text representations of NULL |
12506610 |
12506610 |
0 |
100.00% |
|
| INFO |
INFO |
vehicle_class |
distinct_count |
vehicle_class: 18 distinct values |
12506610 |
12506610 |
0 |
100.00% |
|
| INFO |
INFO |
trailer_prefix |
null_distribution |
trailer_prefix: 23298291 null (95.3%), 1154692 not null (4.7%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
trailer_prefix |
distinct_count |
trailer_prefix: 2 distinct values |
1154692 |
1154692 |
0 |
100.00% |
|
| PASS |
INFO |
trailer_prefix |
text_null |
trailer_prefix should not contain text representations of NULL |
1154692 |
1154692 |
0 |
100.00% |
|
| PASS |
WARNING |
purpose |
not_null |
purpose should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
fuel |
null_distribution |
fuel: 1163992 null (4.8%), 23288991 not null (95.2%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
purpose |
distinct_count |
purpose: 3 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
fuel |
text_null |
fuel should not contain text representations of NULL |
23288991 |
23288991 |
0 |
100.00% |
|
| INFO |
INFO |
secondary_fuel |
null_distribution |
secondary_fuel: 19622957 null (80.2%), 4830026 not null (19.8%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
fuel |
distinct_count |
fuel: 4 distinct values |
23288991 |
23288991 |
0 |
100.00% |
|
| PASS |
INFO |
secondary_fuel |
text_null |
secondary_fuel should not contain text representations of NULL |
4830026 |
4830026 |
0 |
100.00% |
|
| PASS |
WARNING |
purpose |
text_null |
purpose should not contain text representations of NULL |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
secondary_fuel |
distinct_count |
secondary_fuel: 3 distinct values |
4830026 |
4830026 |
0 |
100.00% |
|
| INFO |
INFO |
is_gbo |
null_distribution |
is_gbo: 1158444 null (4.7%), 23294539 not null (95.3%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
is_hybrid |
range |
is_hybrid should be in range [0, 1] |
23294539 |
23294539 |
0 |
100.00% |
|
| INFO |
INFO |
is_hybrid |
null_distribution |
is_hybrid: 1158444 null (4.7%), 23294539 not null (95.3%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
is_gbo |
range |
is_gbo should be in range [0, 1] |
23294539 |
23294539 |
0 |
100.00% |
|
| PASS |
INFO |
fuel_notes |
text_null |
fuel_notes should not contain text representations of NULL |
5322263 |
5322263 |
0 |
100.00% |
|
| INFO |
INFO |
fuel_notes |
null_distribution |
fuel_notes: 19130720 null (78.2%), 5322263 not null (21.8%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
fuel_notes |
distinct_count |
fuel_notes: 4 distinct values |
5322263 |
5322263 |
0 |
100.00% |
|
| PASS |
INFO |
possible_body_types |
text_null_array |
possible_body_types array should not contain text representations of NULL |
17942491 |
17942491 |
0 |
100.00% |
|
| INFO |
INFO |
capacity |
null_distribution |
capacity: 1162993 null (4.8%), 23289990 not null (95.2%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
capacity |
distinct_count |
capacity: 6051 distinct values |
23289990 |
23289990 |
0 |
100.00% |
|
| INFO |
INFO |
possible_fuels |
array_length |
possible_fuels: avg array len=2.0, min=1, max=6 |
17942491 |
17942491 |
0 |
100.00% |
|
| PASS |
INFO |
possible_fuels |
array_empty |
possible_fuels should not contain empty arrays |
17942491 |
17942491 |
0 |
100.00% |
|
| FAIL |
INFO |
capacity |
range |
capacity should be in range [0, 20000] |
23289990 |
23289673 |
317 |
100.00% |
|
| INFO |
INFO |
possible_displacements |
array_length |
possible_displacements: avg array len=4.7, min=0, max=20 |
17942491 |
17942491 |
0 |
100.00% |
|
| FAIL |
INFO |
possible_displacements |
array_empty |
possible_displacements should not contain empty arrays |
17942491 |
17516536 |
425955 |
97.63% |
|
| INFO |
INFO |
own_weight |
null_distribution |
own_weight: 89607 null (0.4%), 24363376 not null (99.6%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
own_weight |
distinct_count |
own_weight: 14219 distinct values |
24363376 |
24363376 |
0 |
100.00% |
|
| PASS |
INFO |
possible_displacements |
array_range |
possible_displacements array elements should be in range [0, 20000] |
84935358 |
84935358 |
0 |
100.00% |
|
| PASS |
INFO |
possible_fuels |
text_null_array |
possible_fuels array should not contain text representations of NULL |
17942491 |
17942491 |
0 |
100.00% |
|
| INFO |
INFO |
total_weight |
null_distribution |
total_weight: 13287 null (0.1%), 24439696 not null (99.9%) |
24452983 |
24452983 |
0 |
100.00% |
|
| FAIL |
INFO |
own_weight |
range |
own_weight should be in range [40, 45000] |
24363376 |
24341083 |
22293 |
99.91% |
|
| INFO |
INFO |
total_weight |
distinct_count |
total_weight: 9630 distinct values |
24439696 |
24439696 |
0 |
100.00% |
|
| FAIL |
INFO |
total_weight |
range |
total_weight should be in range [60, 90000] |
24439696 |
24436417 |
3279 |
99.99% |
|
| INFO |
INFO |
payload |
null_distribution |
payload: 91766 null (0.4%), 24361217 not null (99.6%) |
24452983 |
24452983 |
0 |
100.00% |
|
| FAIL |
INFO |
payload |
range |
payload should be in range [0, 35000] |
24361217 |
24336693 |
24524 |
99.90% |
|
| INFO |
INFO |
n_reg_new_cyrillic |
null_distribution |
n_reg_new_cyrillic: 98849 null (0.4%), 24354134 not null (99.6%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
payload |
distinct_count |
payload: 25084 distinct values |
24361217 |
24361217 |
0 |
100.00% |
|
| INFO |
INFO |
n_reg_latin |
null_distribution |
n_reg_latin: 103011 null (0.4%), 24349972 not null (99.6%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
n_reg_new_cyrillic |
text_null |
n_reg_new_cyrillic should not contain text representations of NULL |
24354134 |
24354134 |
0 |
100.00% |
|
| PASS |
INFO |
n_reg_latin |
text_null |
n_reg_latin should not contain text representations of NULL |
24349972 |
24349972 |
0 |
100.00% |
|
| INFO |
INFO |
has_old_cyrillic |
null_distribution |
has_old_cyrillic: 0 null (0.0%), 24452983 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
has_old_cyrillic |
distinct_count |
has_old_cyrillic: 2 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
plate_type |
not_null |
plate_type should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
plate_type |
distinct_count |
plate_type: 6 distinct values |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
plate_type |
text_null |
plate_type should not contain text representations of NULL |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
plate_type |
allowed_values |
plate_type should be in allowed set |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
region_code |
null_distribution |
region_code: 1688453 null (6.9%), 22764530 not null (93.1%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
is_valid_plate |
not_null |
is_valid_plate should not be null or empty |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
region_code |
distinct_count |
region_code: 167 distinct values |
22764530 |
22764530 |
0 |
100.00% |
|
| INFO |
INFO |
n_reg_latin |
distinct_count |
n_reg_latin: 16724367 distinct values |
24349972 |
24349972 |
0 |
100.00% |
|
| INFO |
INFO |
n_reg_new_cyrillic |
distinct_count |
n_reg_new_cyrillic: 16814791 distinct values |
24354134 |
24354134 |
0 |
100.00% |
|
| PASS |
INFO |
region_code |
text_null |
region_code should not contain text representations of NULL |
22764530 |
22764530 |
0 |
100.00% |
|
| INFO |
INFO |
validation_error |
distinct_count |
validation_error: 1 distinct values |
1684296 |
1684296 |
0 |
100.00% |
|
| PASS |
INFO |
validation_error |
text_null |
validation_error should not contain text representations of NULL |
1684296 |
1684296 |
0 |
100.00% |
|
| INFO |
INFO |
validation_error |
null_distribution |
validation_error: 22768687 null (93.1%), 1684296 not null (6.9%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
needs_moderation |
null_distribution |
needs_moderation: 0 null (0.0%), 24452983 not null (100.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
region_name |
null_distribution |
region_name: 1784078 null (7.3%), 22668905 not null (92.7%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
raw_vin |
null_distribution |
raw_vin: 6480405 null (26.5%), 17972578 not null (73.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
region_name |
distinct_count |
region_name: 29 distinct values |
22668905 |
22668905 |
0 |
100.00% |
|
| INFO |
INFO |
vin |
null_distribution |
vin: 6480406 null (26.5%), 17972577 not null (73.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
raw_vin |
text_null |
raw_vin should not contain text representations of NULL |
17972578 |
17972578 |
0 |
100.00% |
|
| INFO |
INFO |
is_valid_vin |
null_distribution |
is_valid_vin: 6480034 null (26.5%), 17972949 not null (73.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
vin |
text_null |
vin should not contain text representations of NULL |
17972577 |
17972577 |
0 |
100.00% |
|
| INFO |
INFO |
raw_vin |
distinct_count |
raw_vin: 9210043 distinct values |
17972578 |
17972578 |
0 |
100.00% |
|
| INFO |
INFO |
vin_validation_error |
distinct_count |
vin_validation_error: 4 distinct values |
215935 |
215935 |
0 |
100.00% |
|
| PASS |
INFO |
vin_validation_error |
text_null |
vin_validation_error should not contain text representations of NULL |
215935 |
215935 |
0 |
100.00% |
|
| INFO |
INFO |
vin_length |
distinct_count |
vin_length: 27 distinct values |
17972578 |
17972578 |
0 |
100.00% |
|
| INFO |
INFO |
vin_length |
null_distribution |
vin_length: 6480405 null (26.5%), 17972578 not null (73.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
vin_validation_error |
null_distribution |
vin_validation_error: 24237048 null (99.1%), 215935 not null (0.9%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
vin |
distinct_count |
vin: 9209050 distinct values |
17972577 |
17972577 |
0 |
100.00% |
|
| INFO |
INFO |
vin_is_17 |
null_distribution |
vin_is_17: 6480034 null (26.5%), 17972949 not null (73.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
vin_has_ioq |
null_distribution |
vin_has_ioq: 6480034 null (26.5%), 17972949 not null (73.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
vin_wmi |
null_distribution |
vin_wmi: 6682681 null (27.3%), 17770302 not null (72.7%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
vin_wmi |
text_null |
vin_wmi should not contain text representations of NULL |
17770302 |
17770302 |
0 |
100.00% |
|
| PASS |
INFO |
region_name |
text_null |
region_name should not contain text representations of NULL |
22668905 |
22668905 |
0 |
100.00% |
|
| INFO |
INFO |
vin_wmi |
distinct_count |
vin_wmi: 9330 distinct values |
17770302 |
17770302 |
0 |
100.00% |
|
| INFO |
INFO |
vin_wmi_manufacturer |
null_distribution |
vin_wmi_manufacturer: 7205306 null (29.5%), 17247677 not null (70.5%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
vin_wmi_manufacturer |
distinct_count |
vin_wmi_manufacturer: 1695 distinct values |
17247677 |
17247677 |
0 |
100.00% |
|
| INFO |
INFO |
vin_wmi_region |
null_distribution |
vin_wmi_region: 6697032 null (27.4%), 17755951 not null (72.6%) |
24452983 |
24452983 |
0 |
100.00% |
|
| INFO |
INFO |
vin_wmi_region |
distinct_count |
vin_wmi_region: 6 distinct values |
17755951 |
17755951 |
0 |
100.00% |
|
| PASS |
INFO |
vin_wmi_region |
text_null |
vin_wmi_region should not contain text representations of NULL |
17755951 |
17755951 |
0 |
100.00% |
|
| INFO |
INFO |
vin_wmi_known |
null_distribution |
vin_wmi_known: 6682310 null (27.3%), 17770673 not null (72.7%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
vin_wmi_manufacturer |
text_null |
vin_wmi_manufacturer should not contain text representations of NULL |
17247677 |
17247677 |
0 |
100.00% |
|
| INFO |
INFO |
possible_transmissions |
array_length |
possible_transmissions: avg array len=1.7, min=0, max=2 |
17942491 |
17942491 |
0 |
100.00% |
|
| FAIL |
INFO |
possible_transmissions |
array_empty |
possible_transmissions should not contain empty arrays |
17942491 |
17773314 |
169177 |
99.06% |
|
| INFO |
INFO |
possible_drives |
array_length |
possible_drives: avg array len=1.4, min=0, max=3 |
17942491 |
17942491 |
0 |
100.00% |
|
| INFO |
INFO |
backfill_confidence |
null_distribution |
backfill_confidence: 17847166 null (73.0%), 6605817 not null (27.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
backfill_confidence |
text_null |
backfill_confidence should not contain text representations of NULL |
6605817 |
6605817 |
0 |
100.00% |
|
| FAIL |
INFO |
possible_drives |
array_empty |
possible_drives should not contain empty arrays |
17942491 |
17848191 |
94300 |
99.47% |
|
| PASS |
INFO |
backfill_confidence |
allowed_values |
backfill_confidence should be in allowed set |
6605817 |
6605817 |
0 |
100.00% |
|
| INFO |
INFO |
backfill_stage |
null_distribution |
backfill_stage: 17847166 null (73.0%), 6605817 not null (27.0%) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
backfill_stage |
text_null |
backfill_stage should not contain text representations of NULL |
6605817 |
6605817 |
0 |
100.00% |
|
| PASS |
INFO |
backfill_stage |
allowed_values |
backfill_stage should be in allowed set |
6605817 |
6605817 |
0 |
100.00% |
|
| FAIL |
WARNING |
own_weight_lt_total_weight |
custom_sql |
own_weight має бути менший за total_weight |
24361217 |
24360711 |
506 |
100.00% |
|
| FAIL |
WARNING |
weight_ratio_too_high |
custom_sql |
total_weight / own_weight не має перевищувати 4 |
24340478 |
23665816 |
674662 |
97.23% |
|
| FAIL |
INFO |
vin_null_before_2021 |
custom_sql |
VIN має бути NULL для реєстрацій до 2021-01-01 |
13085851 |
6480034 |
6605817 |
49.52% |
|
| FAIL |
INFO |
make_year_vs_model_year |
custom_sql |
model_year (з VIN) не має відрізнятись від make_year більш ніж на 2 роки |
15292385 |
12733635 |
2558750 |
83.27% |
|
| PASS |
WARNING |
negative_weight |
custom_sql |
Від'ємна вага (own_weight або total_weight < 0) |
24441855 |
24441855 |
0 |
100.00% |
|
| PASS |
WARNING |
future_make_year |
custom_sql |
Автомобілі з майбутнього (make_year > поточний рік + 1) |
24452983 |
24452983 |
0 |
100.00% |
|
| PASS |
INFO |
possible_drives |
text_null_array |
possible_drives array should not contain text representations of NULL |
17942491 |
17942491 |
0 |
100.00% |
|
| PASS |
INFO |
possible_transmissions |
text_null_array |
possible_transmissions array should not contain text representations of NULL |
17942491 |
17942491 |
0 |
100.00% |
|