pip install .
pip install pylint
pylint tap_google_sheets -d C,R,W
- - run:
- name: 'Unit Tests'
- command: |
- source ~/.virtualenvs/tap-google-sheets/bin/activate
- pip install nose
- nosetests
- run:
name: 'JSON Validator'
command: |
aws s3 cp s3://com-stitchdata-dev-deployment-assets/environments/tap-tester/sandbox dev_env.sh
source dev_env.sh
source /usr/local/share/virtualenvs/tap-tester/bin/activate
- run-a-test --tap=tap-google-sheets \
- --target=target-stitch \
- --orchestrator=stitch-orchestrator \
- --email=harrison+sandboxtest@stitchdata.com \
- --password=$SANDBOX_PASSWORD \
- --client-id=50 \
- tap_tester.suites.google_sheets
+ run-test --tap=tap-google-sheets \
+ --target=target-stitch \
+ --orchestrator=stitch-orchestrator \
+ --email=harrison+sandboxtest@stitchdata.com \
+ --password=$SANDBOX_PASSWORD \
+ --client-id=50 \
+ tests/tap_combined_test.py
- slack/notify-on-failure:
only_for_branches: master
--- /dev/null
+++ b/tests/tap_combined_test.py
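+"""End-to-end tap-tester test for tap-google-sheets: run discovery, select the
+expected streams, and verify that an initial sync returns rows for every stream."""
+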
+import unittest
+import os
+from datetime import datetime as dt
+from datetime import timedelta
+
+from tap_tester import menagerie
+import tap_tester.runner as runner
+import tap_tester.connections as connections
+from tap_tester.scenario import SCENARIOS
+
+
+class TapCombinedTest(unittest.TestCase):
+ START_DATE_FORMAT = "%Y-%m-%dT00:00:00Z"
+
+ @staticmethod
+ def name():
+ return "tap_google_sheets_combined_test"
+
+ @staticmethod
+ def tap_name():
+ return "tap-google-sheets"
+
+ @staticmethod
+ def get_type():
+ return "platform.google-sheets"
+
+ def expected_check_streams(self):
+ return set(self.expected_pks().keys())
+
+ def expected_sync_streams(self):
+ return set(self.expected_pks().keys())
+
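+    # The four metadata streams use their API primary keys; every other stream is an
+    # individual sheet in the test spreadsheet, keyed by the synthetic __sdc_row column.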
+ @staticmethod
+ def expected_pks():
+ return {
+ "file_metadata": {"id"},
+ "sheet_metadata": {"sheetId"},
+ "sheets_loaded": {"spreadsheetId", "sheetId", "loadDate"},
+ "spreadsheet_metadata": {"spreadsheetId"},
+ "Test-1": {"__sdc_row"},
+ "Test 2": {"__sdc_row"},
+ "SKU COGS": {"__sdc_row"},
+ "Item Master": {"__sdc_row"},
+ "Retail Price": {"__sdc_row"},
+ "Retail Price NEW": {"__sdc_row"},
+ "Forecast Scenarios": {"__sdc_row"},
+ "Promo Type": {"__sdc_row"},
+ "Shipping Method": {"__sdc_row"}
+ }
+
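+    # start_date is pinned to three days before the test run; the spreadsheet under
+    # test is taken from the environment.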
+ def get_properties(self):
+ return_value = {
+ 'start_date': dt.strftime(dt.utcnow() - timedelta(days=3), self.START_DATE_FORMAT),
+ 'spreadsheet_id': os.getenv("TAP_GOOGLE_SHEETS_SPREADSHEET_ID")
+ }
+
+ return return_value
+
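+    # OAuth client credentials and the refresh token are read from the environment
+    # so secrets stay out of the repo.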
+ @staticmethod
+ def get_credentials():
+ return {
+ "client_id": os.getenv("TAP_GOOGLE_SHEETS_CLIENT_ID"),
+ "client_secret": os.getenv("TAP_GOOGLE_SHEETS_CLIENT_SECRET"),
+ "refresh_token": os.getenv("TAP_GOOGLE_SHEETS_REFRESH_TOKEN"),
+ }
+
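+    # Fail fast if any required environment variable is missing.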
+ def setUp(self):
+ missing_envs = [x for x in [
+ "TAP_GOOGLE_SHEETS_SPREADSHEET_ID",
+ "TAP_GOOGLE_SHEETS_START_DATE",
+ "TAP_GOOGLE_SHEETS_CLIENT_ID",
+ "TAP_GOOGLE_SHEETS_CLIENT_SECRET",
+ "TAP_GOOGLE_SHEETS_REFRESH_TOKEN",
+ ] if os.getenv(x) is None]
+
+ if missing_envs:
+ raise Exception("Missing environment variables: {}".format(missing_envs))
+
+ def test_run(self):
+
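+        # Create the connection in Stitch for this tap using the config and credentials above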
+ conn_id = connections.ensure_connection(self, payload_hook=None)
+
+ # Run the tap in check mode
+ check_job_name = runner.run_check_mode(self, conn_id)
+
+ # Verify the check's exit status
+ exit_status = menagerie.get_exit_status(conn_id, check_job_name)
+ menagerie.verify_check_exit_status(self, exit_status, check_job_name)
+
+ # Verify that there are catalogs found
+ found_catalogs = menagerie.get_catalogs(conn_id)
+ self.assertGreater(len(found_catalogs), 0, msg="unable to locate schemas for connection {}".format(conn_id))
+
+ found_catalog_names = set(map(lambda c: c['tap_stream_id'], found_catalogs))
+ subset = self.expected_check_streams().issubset(found_catalog_names)
+ self.assertTrue(subset, msg="Expected check streams are not subset of discovered catalog")
+
+        # Select the catalogs for the expected sync streams
+ our_catalogs = [c for c in found_catalogs if c.get('tap_stream_id') in self.expected_sync_streams()]
+ for catalog in our_catalogs:
+ schema = menagerie.get_annotated_schema(conn_id, catalog['stream_id'])
+ connections.select_catalog_and_fields_via_metadata(conn_id, catalog, schema, [], [])
+
+        # Verify that all streams sync at least one row for the initial sync.
+        # This also verifies access token expiration handling: if the test fails with an
+        # authentication error, the refresh token was not replaced after expiring.
+ menagerie.set_state(conn_id, {})
+ sync_job_name = runner.run_sync_mode(self, conn_id)
+
+        # Verify tap and target exit codes
+ exit_status = menagerie.get_exit_status(conn_id, sync_job_name)
+ menagerie.verify_sync_exit_status(self, exit_status, sync_job_name)
+ record_count_by_stream = runner.examine_target_output_file(self, conn_id, self.expected_sync_streams(),
+ self.expected_pks())
+ zero_count_streams = {k for k, v in record_count_by_stream.items() if v == 0}
+        self.assertFalse(zero_count_streams,
+                         msg="The following streams did not sync any rows: {}".format(zero_count_streams))
+
+
+SCENARIOS.add(TapCombinedTest)