Update Linkedin_Data_API_Calls.py
Linkedin_Data_API_Calls.py  CHANGED  (+47 -18)
@@ -276,21 +276,34 @@ def fetch_linkedin_posts_core(comm_client_id, community_token, org_urn, count):
 
 def fetch_comments(comm_client_id, community_token, post_urns, stats_map):
     """
-    Fetches comments for a list of post URNs.
+    Fetches comments for a list of post URNs using the socialActions endpoint.
     Uses stats_map to potentially skip posts with 0 comments.
     """
-
+    # Ensure community_token is in the expected dictionary format for create_session
+    if isinstance(community_token, str):
+        token_dict = {'access_token': community_token, 'token_type': 'Bearer'}
+    elif isinstance(community_token, dict) and 'access_token' in community_token:
+        token_dict = community_token
+    else:
+        logging.error("Invalid community_token format. Expected a string or a dict with 'access_token'.")
+        return {urn: [] for urn in post_urns}  # Return empty for all if token is bad
+
     linkedin_session = create_session(comm_client_id, token=token_dict)
-    linkedin_session.headers.update({
-        'LinkedIn-Version': "202502"
-    })
 
+    # Set the LinkedIn API version header
+    # This is crucial for API compatibility.
+    linkedin_session.headers.update({
+        'LinkedIn-Version': "202502"  # Or your target version
+    })
+
     all_comments_by_post = {}
     logging.info(f"Fetching comments for {len(post_urns)} posts.")
 
     for post_urn in post_urns:
         post_stats = stats_map.get(post_urn, {})
-
+        # Try to get comment count from "commentSummary" first, then fall back to "commentCount"
+        comment_summary = post_stats.get("commentSummary", {})
+        comment_count_from_stats = comment_summary.get("totalComments", post_stats.get('commentCount', 0))
 
         if comment_count_from_stats == 0:
             logging.info(f"Skipping comment fetch for {post_urn} as commentCount is 0 in stats_map.")
@@ -298,8 +311,11 @@ def fetch_comments(comm_client_id, community_token, post_urns, stats_map):
             continue
 
         try:
-
-
+            # IMPORTANT: Use the correct endpoint structure from your working code.
+            # The post_urn goes directly into the path and should NOT be URL-encoded here.
+            url = f"{API_REST_BASE}/socialActions/{post_urn}/comments?sortOrder=CHRONOLOGICAL"
+            # If you want to add other parameters like 'count' or 'start', append them, e.g.
+            # url = f"{API_REST_BASE}/socialActions/{post_urn}/comments?sortOrder=CHRONOLOGICAL&count=10"
 
             logging.debug(f"Fetching comments from URL: {url} for post URN: {post_urn}")
             response = linkedin_session.get(url)
@@ -308,28 +324,41 @@ def fetch_comments(comm_client_id, community_token, post_urns, stats_map):
                 elements = response.json().get('elements', [])
                 comments_texts = []
                 for c in elements:
-
-
-
+                    # Extracting comment text. Adjust if the structure is different.
+                    # The original working code stored `data.get('elements', [])`.
+                    # If you need the full comment object, store 'c' instead of 'comment_text'.
+                    message_obj = c.get('message', {})
+                    if isinstance(message_obj, dict):  # Ensure message is a dict before .get('text')
+                        comment_text = message_obj.get('text')
+                        if comment_text:
+                            comments_texts.append(comment_text)
+                    elif isinstance(message_obj, str):  # Sometimes message might be just a string
+                        comments_texts.append(message_obj)
+
                 all_comments_by_post[post_urn] = comments_texts
                 logging.info(f"Fetched {len(comments_texts)} comments for {post_urn}.")
             elif response.status_code == 403:
-
-
+                logging.warning(f"Forbidden (403) to fetch comments for {post_urn}. URL: {url}. Response: {response.text}. Check permissions or API version.")
+                all_comments_by_post[post_urn] = []  # Or some error indicator
             elif response.status_code == 404:
-
-
+                logging.warning(f"Comments not found (404) for {post_urn}. URL: {url}. Response: {response.text}")
+                all_comments_by_post[post_urn] = []
             else:
                 logging.error(f"Error fetching comments for {post_urn}. Status: {response.status_code}. URL: {url}. Response: {response.text}")
-                all_comments_by_post[post_urn] = []
+                all_comments_by_post[post_urn] = []  # Or some error indicator
         except requests.exceptions.RequestException as e:
             logging.error(f"RequestException fetching comments for {post_urn}: {e}")
            all_comments_by_post[post_urn] = []
         except json.JSONDecodeError as e:
-
+            # Log the response text if it's available and JSON decoding fails
+            response_text_for_log = 'N/A'
+            if 'response' in locals() and hasattr(response, 'text'):
+                response_text_for_log = response.text
+            logging.error(f"JSONDecodeError fetching comments for {post_urn}. Response: {response_text_for_log}. Error: {e}")
             all_comments_by_post[post_urn] = []
         except Exception as e:
-
+            # Catch any other unexpected errors
+            logging.error(f"Unexpected error fetching comments for {post_urn}: {e}", exc_info=True)  # exc_info=True for traceback
             all_comments_by_post[post_urn] = []
 
     return all_comments_by_post
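
For context, a minimal sketch of how the updated fetch_comments might be driven. This is illustrative only: the credentials, post URNs, and the shape of stats_map below are assumptions inferred from the lookups in the diff (commentSummary.totalComments with a flat commentCount fallback), not values from this repository; create_session and API_REST_BASE are expected to come from the surrounding module.

# Hypothetical usage sketch; adjust names and values to the rest of the module.
import logging

from Linkedin_Data_API_Calls import fetch_comments  # assumes the module is importable

logging.basicConfig(level=logging.INFO)

comm_client_id = "your-client-id"          # placeholder credential
community_token = "AQX..."                 # raw access token; fetch_comments wraps a string into a token dict

post_urns = [
    "urn:li:ugcPost:7180000000000000000",  # hypothetical post URN
    "urn:li:share:7180000000000000001",    # hypothetical share URN
]

# stats_map shaped to match the two lookups in fetch_comments:
# commentSummary.totalComments first, then a flat commentCount fallback.
stats_map = {
    post_urns[0]: {"commentSummary": {"totalComments": 4}},
    post_urns[1]: {"commentCount": 0},     # this post is skipped without an API call
}

comments_by_post = fetch_comments(comm_client_id, community_token, post_urns, stats_map)
for urn, texts in comments_by_post.items():
    print(urn, len(texts), "comments")

Because posts with a zero count in stats_map are skipped before any request is made, the second URN above never hits the socialActions endpoint; only the first one triggers a GET and has its comment texts collected.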