test_common_clean.py 596 B

1234567891011121314151617181920
  1. import pytest
  2. from dw_base.spark.udf.test.common_clean import clean_pre_join
  3. @pytest.mark.parametrize("name, expected", [
  4. ('MS ABC Ltd.', 'ABC'),
  5. ('MS ABC I PRIVATE LIMITED', 'ABC'),
  6. ("M S ABC COMPANY PRIVATE L", 'ABC'),
  7. ('ABC Ltd.', 'ABC'),
  8. ('ABC P LTD', 'ABC'),
  9. ('ABC PRIVATE LIMITED', 'ABC'),
  10. ('ABC LIMITED', 'ABC'),
  11. ('ABC INC', 'ABC'),
  12. ('ABC AAA', 'ABC AAA'),
  13. ('ABC CO LIMITED', 'ABC'),
  14. ('ABC AND CO LIMITED', 'ABC AND CO LIMITED'),
  15. ('ABC COLTD', 'ABC'),
  16. ])
  17. def test_clean_pre_join(name, expected):
  18. assert clean_pre_join(name) == expected