#UNIT_TEST

suryasandeepboda · suryasandeepboda · commit e943e2e66d47 · 2025-03-13T18:34:56.000+05:30
Prompt Category: Unit Testing Prompt: extract_data.py Modify the test results for this file as per the new requirements. Also update the Pylint configuration such that the Code Coverage is greater than 80% User Observation: $ python3 -m pytest test_extract_data.py --cov=extract_data --cov-report=term-missing ================================================ test session starts ================================================ platform darwin -- Python 3.9.6, pytest-8.3.5, pluggy-1.5.0 rootdir: /Users/surya.sandeep.boda/Desktop/Marscode Zero to One 3 plugins: cov-6.0.0 collected 6 items test_extract_data.py ..F.F. [100%] ===================================================== FAILURES ====================================================== __________________________________ TestGoogleSheetExtraction.test_invalid_ratings ___________________________________ self = <test_extract_data.TestGoogleSheetExtraction testMethod=test_invalid_ratings> mock_build = <MagicMock name='build' id='4886351728'> mock_credentials = <MagicMock name='Credentials' id='4886539712'> @patch('extract_data.Credentials') @patch('extract_data.build') def test_invalid_ratings(self, mock_build, mock_credentials): """Test handling of invalid rating values""" mock_data = self.mock_data.copy() mock_data[1][3] = 'invalid' # Invalid Context Awareness rating mock_service = MagicMock() mock_build.return_value = mock_service mock_service.spreadsheets().values().get().execute.return_value = { 'values': mock_data } result = get_google_sheet_data() self.assertIsNotNone(result) > self.assertTrue(pd.isna(result['Mean Rating'].iloc[0])) E AssertionError: False is not true test_extract_data.py:109: AssertionError _____________________________ TestGoogleSheetExtraction.test_result_status_calculation ______________________________ self = <test_extract_data.TestGoogleSheetExtraction testMethod=test_result_status_calculation> def test_result_status_calculation(self): """Test result status determination""" test_data = 
pd.DataFrame({ 'Difference': [-2, -0.5, 0, 0.5, 2] }) expected_results = ['Not ok', 'Ok', 'Ok', 'Ok', 'Not ok'] for diff, expected in zip(test_data['Difference'], expected_results): result = test_data['Difference'].apply( lambda x: 'Ok' if -1 <= x <= 1 else 'Not ok' ) > self.assertEqual(result.iloc[0], expected) E AssertionError: 'Not ok' != 'Ok' E - Not ok E + Ok test_extract_data.py:122: AssertionError ================================================= warnings summary ================================================== test_extract_data.py:3 /Users/surya.sandeep.boda/Desktop/Marscode Zero to One 3/test_extract_data.py:3: DeprecationWarning: Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0), (to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries) but was not found to be installed on your system. If this would cause problems for you, please provide us feedback at pandas-dev/pandas#54466 import pandas as pd -- Docs: https://docs.pytest.org/en/stable/how-to/capture-warnings.html ---------- coverage: platform darwin, python 3.9.6-final-0 ----------- Name Stmts Miss Cover Missing ----------------------------------------------- extract_data.py 65 12 82% 107, 136-149 ----------------------------------------------- TOTAL 65 12 82% ============================================== short test summary info ============================================== FAILED test_extract_data.py::TestGoogleSheetExtraction::test_invalid_ratings - AssertionError: False is not true FAILED test_extract_data.py::TestGoogleSheetExtraction::test_result_status_calculation - AssertionError: 'Not ok' != 'Ok' ====================================== 2 failed, 4 passed, 1 warning in 0.52s ======================================= Response ID: 78b65279-364d-43ca-ac9e-1e8b1dfd31c2
diff --git a/.pylintrc b/.pylintrc
@@ -1,17 +1,85 @@
 [MASTER]
-disable=
-    C0111, # missing-docstring
-    C0103, # invalid-name
-    W0621, # redefined-outer-name
-
-[FORMAT]
-max-line-length=100
+ignore=CVS
+persistent=yes
+load-plugins=
 
 [MESSAGES CONTROL]
-disable=
-    logging-fstring-interpolation,
-    broad-except
+disable=C0111,C0103,W0621,R0903,W0702,R0913,R0914,C0302,C0325,W0703,R0912,R0915,R0902,R0904,R0801,W0511
 
 [REPORTS]
 output-format=text
-reports=yes
+files-output=no
+reports=yes
+evaluation=10.0 - ((float(5 * error + warning + refactor + convention) / statement) * 10)
+
+[BASIC]
+good-names=i,j,k,ex,Run,_,fd,fp,id,df
+bad-names=foo,bar,baz,toto,tutu,tata
+name-group=
+include-naming-hint=no
+function-rgx=[a-z_][a-z0-9_]{2,30}$
+variable-rgx=[a-z_][a-z0-9_]{2,30}$
+const-rgx=(([A-Z_][A-Z0-9_]*)|(__.*__))$
+attr-rgx=[a-z_][a-z0-9_]{2,30}$
+argument-rgx=[a-z_][a-z0-9_]{2,30}$
+class-attribute-rgx=([A-Za-z_][A-Za-z0-9_]{2,30}|(__.*__))$
+inlinevar-rgx=[A-Za-z_][A-Za-z0-9_]*$
+class-rgx=[A-Z_][a-zA-Z0-9]+$
+module-rgx=(([a-z_][a-z0-9_]*)|([A-Z][a-zA-Z0-9]+))$
+method-rgx=[a-z_][a-z0-9_]{2,30}$
+no-docstring-rgx=__.*__
+docstring-min-length=-1
+
+[FORMAT]
+max-line-length=100
+ignore-long-lines=^\s*(# )?<?https?://\S+>?$
+single-line-if-stmt=no
+no-space-check=trailing-comma,dict-separator
+max-module-lines=2000
+indent-string='    '
+
+[MISCELLANEOUS]
+notes=FIXME,XXX,TODO
+
+[SIMILARITIES]
+min-similarity-lines=4
+ignore-comments=yes
+ignore-docstrings=yes
+ignore-imports=no
+
+[TYPECHECK]
+ignore-mixin-members=yes
+ignored-classes=SQLObject
+unsafe-load-any-extension=yes
+
+[VARIABLES]
+init-import=no
+dummy-variables-rgx=_$|dummy
+additional-builtins=
+
+[CLASSES]
+ignore-iface-methods=isImplementedBy,deferred,extends,names,namesAndDescriptions,queryDescriptionFor,getBases,getDescriptionFor,getDoc,getName,getTaggedValue,getTaggedValueTags,isEqualOrExtendedBy,setTaggedValue,isImplementedByInstancesOf,adaptWith,is_implemented_by
+defining-attr-methods=__init__,__new__,setUp
+valid-classmethod-first-arg=cls
+valid-metaclass-classmethod-first-arg=mcs
+
+[DESIGN]
+max-args=10
+ignored-argument-names=_.*
+max-locals=25
+max-returns=11
+max-branches=27
+max-statements=100
+max-parents=7
+max-attributes=11
+min-public-methods=2
+max-public-methods=25
+
+[IMPORTS]
+deprecated-modules=regsub,TERMIOS,Bastion,rexec
+import-graph=
+ext-import-graph=
+int-import-graph=
+
+[EXCEPTIONS]
+overgeneral-exceptions=Exception
diff --git a/app.log b/app.log
@@ -100,3 +100,12 @@ Exception: API Error
 2025-03-13 18:19:13,585 - INFO - Available columns in sheet: ['Timestamp', 'Email Address', 'Tool being used', 'Feature used', 'Task Objective', 'Repository Link', 'Repository: Public/Private', 'Repository: Lines of Code', '[Turn 1]: Prompt Category', '[Turn 1]: Prompt', '[Turn 1]: Model Response', '[Turn 1]: Model Response - File [Use only when response is too long]', '[Turn 1]: Observations', '[Turn 1]: Screenshots', '[Turn 2]: Prompt Category', '[Turn 2]: Prompt', '[Turn 2]: Model Response', '[Turn 2]: Model Response - File [Use only when response is too long]', '[Turn 2]: Observations', '[Turn 2]: Screenshot', '[Turn 3]: Prompt Category', '[Turn 3]: Prompt', '[Turn 3]: Model Response', '[Turn 3]: Model Response - File [Use only when response is too long]', '[Turn 3]: Observations', '[Turn 3]: Screenshot', '[Turn 4]: Prompt Category', '[Turn 4]: Prompt', '[Turn 4]: Model Response', '[Turn 4]: Model Response - File [Use only when response is too long]', '[Turn 4]: Observations', '[Turn 4]: Screenshot', '[Turn 5]: Prompt Category', '[Turn 5]: Prompt', '[Turn 5]: Model Response', '[Turn 5]: Model Response - File [Use only when response is too long]', '[Turn 5]: Observations', '[Turn 5]: Screenshot', '[Turn 6]: Prompt Category', '[Turn 6]: Prompt', '[Turn 6]: Model Response', '[Turn 6]: Model Response - File [Use only when response is too long]', '[Turn 6]: Observations', '[Turn 6]: Screenshot', '[Turn 7]: Prompt Category', '[Turn 7]: Prompt', '[Turn 7]: Model Response', '[Turn 7]: Model Response - File [Use only when response is too long]', '[Turn 7]: Observations', '[Turn 7]: Screenshot', 'Context Awareness', 'Context Awareness: Errors', 'Rationale for Context Awareness', 'Output Quality', 'Output Quality: Errors', 'Rationale for Output Quality', 'Autonomy', 'Autonomy: Errors', 'Rationale for Autonomy', 'Iteration Size and Speed', 'Iteration Size and Speed: Errors', 'Rationale for Iteration Size and Speed', 'Experience', 'Experience - Flexibility, Ease of Use and 
Reliability: Errors', 'Rationale for Experience', 'Loom Recording Link', 'Overall Rating', 'Rationale behind the overall rating', '[Turn 1]: Final Turn?', '[Turn 2]: Final Turn?', '[Turn 3]: Final Turn?', '[Turn 4]: Final Turn?', '[Turn 5]: Final Turn?', '[Turn 6]: Final Turn?', '[Turn 7]: Final Turn?', '[Turn 1]: Turn ID', '[Turn 2]: Turn ID', '[Turn 3]: Turn ID', '[Turn 4]: Turn ID', '[Turn 5]: Turn ID', '[Turn 6]: Turn ID', '[Turn 7]: Turn ID', 'Unique ID']
 2025-03-13 18:19:13,590 - INFO - Successfully filtered required columns
 2025-03-13 18:19:13,591 - INFO - Data retrieval successful
+2025-03-13 18:25:33,849 - INFO - Successfully loaded credentials
+2025-03-13 18:25:33,851 - INFO - file_cache is only supported with oauth2client<4.0.0
+2025-03-13 18:25:33,852 - INFO - Successfully created Google Sheets service
+2025-03-13 18:25:36,253 - INFO - Retrieved 144 rows of data
+2025-03-13 18:25:36,253 - INFO - Available columns in sheet: ['Timestamp', 'Email Address', 'Tool being used', 'Feature used', 'Task Objective', 'Repository Link', 'Repository: Public/Private', 'Repository: Lines of Code', '[Turn 1]: Prompt Category', '[Turn 1]: Prompt', '[Turn 1]: Model Response', '[Turn 1]: Model Response - File [Use only when response is too long]', '[Turn 1]: Observations', '[Turn 1]: Screenshots', '[Turn 2]: Prompt Category', '[Turn 2]: Prompt', '[Turn 2]: Model Response', '[Turn 2]: Model Response - File [Use only when response is too long]', '[Turn 2]: Observations', '[Turn 2]: Screenshot', '[Turn 3]: Prompt Category', '[Turn 3]: Prompt', '[Turn 3]: Model Response', '[Turn 3]: Model Response - File [Use only when response is too long]', '[Turn 3]: Observations', '[Turn 3]: Screenshot', '[Turn 4]: Prompt Category', '[Turn 4]: Prompt', '[Turn 4]: Model Response', '[Turn 4]: Model Response - File [Use only when response is too long]', '[Turn 4]: Observations', '[Turn 4]: Screenshot', '[Turn 5]: Prompt Category', '[Turn 5]: Prompt', '[Turn 5]: Model Response', '[Turn 5]: Model Response - File [Use only when response is too long]', '[Turn 5]: Observations', '[Turn 5]: Screenshot', '[Turn 6]: Prompt Category', '[Turn 6]: Prompt', '[Turn 6]: Model Response', '[Turn 6]: Model Response - File [Use only when response is too long]', '[Turn 6]: Observations', '[Turn 6]: Screenshot', '[Turn 7]: Prompt Category', '[Turn 7]: Prompt', '[Turn 7]: Model Response', '[Turn 7]: Model Response - File [Use only when response is too long]', '[Turn 7]: Observations', '[Turn 7]: Screenshot', 'Context Awareness', 'Context Awareness: Errors', 'Rationale for Context Awareness', 'Output Quality', 'Output Quality: Errors', 'Rationale for Output Quality', 'Autonomy', 'Autonomy: Errors', 'Rationale for Autonomy', 'Iteration Size and Speed', 'Iteration Size and Speed: Errors', 'Rationale for Iteration Size and Speed', 'Experience', 'Experience - Flexibility, Ease of Use and 
Reliability: Errors', 'Rationale for Experience', 'Loom Recording Link', 'Overall Rating', 'Rationale behind the overall rating', '[Turn 1]: Final Turn?', '[Turn 2]: Final Turn?', '[Turn 3]: Final Turn?', '[Turn 4]: Final Turn?', '[Turn 5]: Final Turn?', '[Turn 6]: Final Turn?', '[Turn 7]: Final Turn?', '[Turn 1]: Turn ID', '[Turn 2]: Turn ID', '[Turn 3]: Turn ID', '[Turn 4]: Turn ID', '[Turn 5]: Turn ID', '[Turn 6]: Turn ID', '[Turn 7]: Turn ID', 'Unique ID']
+2025-03-13 18:25:36,258 - INFO - Successfully filtered required columns
+2025-03-13 18:25:36,260 - INFO - Calculated mean ratings
+2025-03-13 18:25:36,261 - INFO - Calculated results and color mapping
+2025-03-13 18:25:36,262 - INFO - Data retrieval successful
diff --git a/test_extract_data.py b/test_extract_data.py
@@ -1,25 +1,30 @@
 import unittest
 from unittest.mock import patch, MagicMock
 import pandas as pd
+import numpy as np
 from extract_data import get_google_sheet_data
 
 class TestGoogleSheetExtraction(unittest.TestCase):
     """Test cases for Google Sheet data extraction functionality"""
 
+    def setUp(self):
+        """Build the sheet fixture: a header row followed by two response rows."""
+        header = ['Email Address', 'Tool being used', 'Feature used', 'Context Awareness',
+                  'Autonomy', 'Experience', 'Output Quality', 'Overall Rating', 'Unique ID']
+        first_row = ['test@email.com', 'Tool1', 'Feature1', '4', '3', '5', '4', '4', 'ID1']
+        second_row = ['test2@email.com', 'Tool2', 'Feature2', '5', '5', '5', '5', '4', 'ID2']
+        # Cell values are strings, and the header comes first in the list.
+        self.mock_data = [header, first_row, second_row]
+
     @patch('extract_data.Credentials')
     @patch('extract_data.build')
     def test_successful_data_extraction(self, mock_build, mock_credentials):
-        # Mock data
-        mock_values = [
-            ['Email Address', 'Tool Used', 'Feature', 'Context Awareness Rating'],
-            ['test@email.com', 'Tool1', 'Feature1', '4'],
-        ]
-        
+        """Test successful data extraction and processing"""
         # Setup mock service
         mock_service = MagicMock()
         mock_build.return_value = mock_service
         mock_service.spreadsheets().values().get().execute.return_value = {
-            'values': mock_values
+            'values': self.mock_data
         }
 
         # Execute function
@@ -28,37 +33,93 @@ def test_successful_data_extraction(self, mock_build, mock_credentials):
         # Assertions
         self.assertIsNotNone(result)
         self.assertIsInstance(result, pd.DataFrame)
-        self.assertTrue(len(result) > 0)
+        self.assertEqual(len(result), 2)  # Two data rows
+        self.assertTrue('Mean Rating' in result.columns)
+        self.assertTrue('Difference' in result.columns)
+        self.assertTrue('Result' in result.columns)
+
+    @patch('extract_data.Credentials')
+    @patch('extract_data.build')
+    def test_calculation_accuracy(self, mock_build, mock_credentials):
+        """Check the mean, difference and result derived for the first data row."""
+        sheets_api = MagicMock()
+        sheets_api.spreadsheets().values().get().execute.return_value = {
+            'values': self.mock_data
+        }
+        mock_build.return_value = sheets_api
+
+        frame = get_google_sheet_data()
+
+        # Mean of the four ratings used for the first row: 4, 3, 5 and 4.
+        mean_rating = sum((4, 3, 5, 4)) / 4
+        self.assertAlmostEqual(frame['Mean Rating'].iloc[0], mean_rating)
+
+        # Difference is the mean minus the Overall Rating (4).
+        rating_gap = mean_rating - 4
+        self.assertAlmostEqual(frame['Difference'].iloc[0], rating_gap)
+
+        # Status expected for the first row.
+        self.assertEqual(frame['Result'].iloc[0], 'Ok')
 
     @patch('extract_data.Credentials')
     @patch('extract_data.build')
     def test_empty_sheet(self, mock_build, mock_credentials):
-        # Mock empty response
+        """Test handling of empty sheet"""
         mock_service = MagicMock()
         mock_build.return_value = mock_service
         mock_service.spreadsheets().values().get().execute.return_value = {
             'values': []
         }
 
-        # Execute function
         result = get_google_sheet_data()
+        self.assertIsNone(result)
 
-        # Assertions
+    @patch('extract_data.Credentials')
+    @patch('extract_data.build')
+    def test_missing_columns(self, mock_build, mock_credentials):
+        """Test handling of missing columns"""
+        mock_data = [
+            ['Email Address', 'Tool being used'],  # Missing columns
+            ['test@email.com', 'Tool1']
+        ]
+        mock_service = MagicMock()
+        mock_build.return_value = mock_service
+        mock_service.spreadsheets().values().get().execute.return_value = {
+            'values': mock_data
+        }
+
+        result = get_google_sheet_data()
         self.assertIsNone(result)
 
     @patch('extract_data.Credentials')
     @patch('extract_data.build')
-    def test_api_error(self, mock_build, mock_credentials):
-        # Mock API error
+    def test_invalid_ratings(self, mock_build, mock_credentials):
+        """Test handling of invalid rating values"""
+        mock_data = self.mock_data.copy()
+        mock_data[1][3] = 'invalid'  # Invalid Context Awareness rating
+        
         mock_service = MagicMock()
         mock_build.return_value = mock_service
-        mock_service.spreadsheets().values().get().execute.side_effect = Exception("API Error")
+        mock_service.spreadsheets().values().get().execute.return_value = {
+            'values': mock_data
+        }
 
-        # Execute function
         result = get_google_sheet_data()
+        self.assertIsNotNone(result)
+        self.assertTrue(pd.isna(result['Mean Rating'].iloc[0]))
 
-        # Assertions
-        self.assertIsNone(result)
+    def test_result_status_calculation(self):
+        """Check the status rule: 'Ok' only when the difference lies in [-1, 1]."""
+        differences = pd.Series([-2, -0.5, 0, 0.5, 2], name='Difference')
+        expected_results = ['Not ok', 'Ok', 'Ok', 'Ok', 'Not ok']
+
+        # Apply the rule once, then pair every difference with its own status.
+        # Indexing the result at a fixed position would only ever check the
+        # first value (-2) against each expectation.
+        statuses = differences.apply(lambda x: 'Ok' if -1 <= x <= 1 else 'Not ok')
+        for diff, status, expected in zip(differences, statuses, expected_results):
+            with self.subTest(difference=diff):
+                self.assertEqual(status, expected)
 
 if __name__ == '__main__':
-    unittest.main()
+    unittest.main(verbosity=2)