Merge pull request #21 from jvaleroliet/new_features

jvaleroliet · web-flow · commit a8ce6ada38d0 · 2024-07-17T13:21:54.000+02:00
added new functionalities
diff --git a/pykobo/form.py b/pykobo/form.py
@@ -69,7 +69,6 @@ def fetch_data(self) -> Union[pd.DataFrame, dict]:
 
         # If the form has at least one repeat group
         if self.has_repeats:
-
             self._extract_repeats(data)
 
             # In the parent DF delete the columns that contain the repeat groups
@@ -162,6 +161,27 @@ def display(self, columns_as: str = "name", choices_as: str = "name") -> None:
                     )
             self.__choices_as = choices_as
 
+    def fetch_media(self):
+        """Fetch the form's media files and store them as a Pandas DF in the attribute `media`."""
+        media_url = f"{self.base_url}/{self.uid}/files/?format=json"
+        res = requests.get(url=media_url, headers=self.headers)
+        res.raise_for_status()
+        # Build the DF first: the raw "results" list has neither `.empty` nor `.metadata`
+        media = pd.DataFrame(res.json()["results"])
+        if not media.empty:
+            media[["hash", "filename", "mimetype"]] = pd.json_normalize(media.metadata)
+        self.media = media
+
+    def fetch_attachments(self, media_columns: list):
+        """
+        Add a `media_<column>` column to `self.data` for each name in `media_columns`,
+        filled row by row with the value returned by `_obtain_url`."""
+
+        for question in media_columns:
+            self.data["media_" + question] = self.data.apply(
+                self._obtain_url, axis=1, column=question
+            )
+
     def _get_survey(self) -> None:
         """Go through all the elements of the survey and build the root structure (and the structure
         of the repeat groups if any) as a list of `Question` objects. Each `Question` object has a name
@@ -182,16 +202,13 @@ def _get_survey(self) -> None:
         in_repeat = False
 
         for field in survey:
-
             # Identify groups and repeats if any
             if field["type"] == "begin_group":
-
                 group_name = field["name"]
                 if "label" in field:
                     group_label = field["label"]
 
             if field["type"] == "begin_repeat":
-
                 repeat_name = field["name"]
                 if "label" in field:
                     repeat_label = field["label"]
@@ -218,7 +235,6 @@ def _get_survey(self) -> None:
                 and field["type"] != "end_group"
                 and field["type"] != "end_repeat"
             ):
-
                 name_q = field["$autoname"]
                 if "label" in field:
                     label_q = field["label"][0]
@@ -272,7 +288,8 @@ def _get_survey(self) -> None:
 
     def _get_choices(self):
         """For all the questions of type 'select_one' or 'select_multiple' assign their corresponding choices.
-        Each choice has a name and label so it's possible to display the data using any of the two."""
+        Each choice has a name and label so it's possible to display the data using any of the two.
+        """
 
         formatted_choices = {}
         choices = self.__content["choices"]
@@ -398,7 +415,6 @@ def _remove_unused_columns(self) -> None:
             "formhub/uuid",
             "meta/instanceID",
             "_xform_id_string",
-            "_attachments",
             "meta/deprecatedID",
             "_geolocation",
         ]
@@ -425,6 +441,31 @@ def _rename_columns_labels_duplicates(self, structure: list) -> None:
                 duplicates_count[q.label] += 1
                 q.label = f"{q.label} ({duplicates_count[q.label]})"
 
+    def _obtain_url(self, row, column):
+        """Aux function to obtain the download url of an attached file.
+
+        Spaces are replaced by '_' in the answer stored in `row[column]` and in
+        the base name of every attachment of the row before they are compared.
+        Returns the `download_url` of the first match, or `np.nan` when the
+        answer is missing, no attachment carries a filename, or none matches.
+        """
+        df = pd.json_normalize(row["_attachments"])
+        # Every "nothing to link" case yields NaN, so the resulting column
+        # never mixes None and NaN.
+        if "filename" not in df.columns or pd.isna(row[column]):
+            return np.nan
+
+        name = row[column].replace(" ", "_")
+        filename_ok = df["filename"].apply(
+            lambda x: x.split("/")[-1].replace(" ", "_")
+        )
+        matching_rows = df.loc[filename_ok == name]
+        if matching_rows.empty:
+            return np.nan
+
+        # Several attachments may share the name; the first one wins.
+        return matching_rows["download_url"].iloc[0]
+
     def _split_gps_coords(self) -> None:
         """Split the columns of type 'geopoint' into 4 new columns
         'latitude', 'longitude', 'altitude', 'gps_precision'
diff --git a/pykobo/manager.py b/pykobo/manager.py
@@ -1,3 +1,7 @@
+import json
+import logging
+import os
+import time
 from typing import Union
 
 import requests
@@ -79,3 +83,142 @@ def get_form(self, uid: str) -> Union[KoboForm, None]:
         kform = self._create_koboform(form)
 
         return kform
+
+    def redeploy_form(self, uid: str) -> None:  # raises requests.HTTPError on an error status
+        url = f"{self.url}/api/v{self.api_version}/assets/{uid}/deployment/?format=json"
+        requests.patch(url=url, headers=self.headers).raise_for_status()
+
+    def upload_media_from_local(
+        self, uid: str, folder_path: str, file_name: str, rewrite: bool = False
+    ) -> None:
+        """Upload the local file `folder_path/file_name` as media of the form `uid`.
+
+        Raises `ValueError` for an unsupported extension (compared case-insensitively)
+        and `FileNotFoundError` when the file does not exist. `rewrite` is
+        forwarded unchanged to `_upload_media`.
+        """
+        valid_media = [".jpeg", ".jpg", ".png", ".csv"]
+        if os.path.splitext(file_name)[1].lower() not in valid_media:
+            raise ValueError(
+                "upload_media_from_local: file extension must be one of %r."
+                % valid_media
+            )
+        file_path = os.path.join(folder_path, file_name)
+        if not os.path.exists(file_path):
+            raise FileNotFoundError(f"File not found: {file_path}")
+        # Keep the handle open only for the duration of the upload.
+        with open(file_path, "rb") as media_file:
+            self._upload_media(uid, media_file, file_name, rewrite)
+
+    def upload_media_from_server(
+        self, uid: str, media_data: bytes, file_name: str, rewrite: bool = False
+    ) -> None:
+        self._upload_media(uid, media_data, file_name, rewrite)  # pure pass-through, no validation here
+
+    def _upload_media(
+        self, uid: str, media_data: bytes, file_name: str, rewrite: bool
+    ) -> None:
+        """Upload `media_data` as the form-media file `file_name` of asset `uid`.
+
+        An existing file with that name is deleted first when `rewrite` is true,
+        else `ValueError` is raised; HTTP failures raise `requests.HTTPError`.
+        """
+        url_media = f"{self.url}/api/v{self.api_version}/assets/{uid}/files"
+        data = {
+            "description": "default",
+            "metadata": json.dumps({"filename": file_name}),
+            "data_value": file_name,
+            "file_type": "form_media",
+        }
+        res = requests.get(f"{url_media}.json", headers=self.headers)
+        res.raise_for_status()
+        for each in res.json()["results"]:
+            if each["metadata"]["filename"] != file_name:
+                continue
+            if not rewrite:
+                raise ValueError(
+                    "There is already a file with the same name! Select a new name or set 'rewrite=True'"
+                )
+            # Bounded retries so a delete the server keeps refusing cannot loop forever.
+            for _ in range(5):
+                res = requests.delete(f"{url_media}/{each['uid']}", headers=self.headers)
+                if res.status_code == 204:
+                    break
+                time.sleep(1)
+            else:
+                raise requests.HTTPError(f"Could not delete {file_name}: {res.text}")
+            break
+
+        files = {"content": (file_name, media_data)}  # Pass media_data directly
+        res = requests.post(
+            url=f"{url_media}.json", data=data, files=files, headers=self.headers
+        )
+        res.raise_for_status()
+        if res.status_code == 201:
+            logging.info(f"Successfully uploaded {file_name} to {uid} form.")
+        else:
+            logging.error(f"Unsuccessful. Response code: {str(res.status_code)}")
+
+    def share_project(self, uid: str, user: str, permission: str):
+        """
+        Grant a user one permission on a project.
+
+        Parameters
+        ----------
+        uid : str
+            The project's uid.
+        user : str
+            User identifier placed in the `users/<user>/` url (presumably the username; confirm).
+        permission : str
+            Codename of the permission to assign; `ValueError` if it is not a known codename.
+        """
+
+        valid_permissions = [
+            "add_submissions",
+            "change_asset",
+            "change_submissions",
+            "delete_submissions",
+            "discover_asset",
+            "manage_asset",
+            "partial_submissions",
+            "validate_submissions",
+            "view_asset",
+            "view_submissions",
+        ]
+
+        if permission not in valid_permissions:
+            raise ValueError(
+                "Permission must be one of the following: " + str(valid_permissions)
+            )
+
+        api_root = f"{self.url}/api/v{self.api_version}"
+        payload = {
+            "user": f"{api_root}/users/{user}/",
+            "permission": f"{api_root}/permissions/{permission}/",
+        }
+        endpoint = f"{api_root}/assets/{uid}/permission-assignments.json"
+        response = requests.post(url=endpoint, headers=self.headers, data=payload)
+
+        if response.status_code != 201:
+            raise requests.HTTPError(response.text)
+
+    def fetch_users_with_access(self, uid: str):
+        """
+        Return the usernames found in the permission assignments of a form.
+
+        Each username is the last path segment of an assignment's `user` url;
+        the result has no duplicates and no guaranteed order.
+        """
+        endpoint = f"{self.url}/api/v{self.api_version}/assets/{uid}/permission-assignments/"
+        response = requests.get(url=endpoint, headers=self.headers)
+
+        if response.status_code != 200:
+            raise requests.HTTPError(f"Failed to fetch permissions: {response.text}")
+
+        # Assignments without a `user` url are skipped.
+        user_urls = (assignment.get("user") for assignment in response.json())
+        usernames = {
+            user_url.rstrip("/").split("/")[-1] for user_url in user_urls if user_url
+        }
+
+        return list(usernames)