From 0e8d3b76c180adfd0c64b8edf016d0ac0bb13938 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Tue, 8 Nov 2022 08:19:09 +0700
Subject: [PATCH 01/17] better wording for scheduler frequency, #358

---
 docs/Settings.md                                | 2 +-
 tubearchivist/home/templates/home/settings.html | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)
diff --git a/docs/Settings.md b/docs/Settings.md
index 72e69e7..0bc920d 100644
--- a/docs/Settings.md
+++ b/docs/Settings.md
@@ -102,7 +102,7 @@ Examples:
 NOTE:
 - Changes in the scheduler settings require a container restart to take effect.
 - Cron format as *number*/*number* are none standard cron and are not supported by the scheduler, for example **0 0/12 \*** is invalid, use **0 \*/12 \*** instead.
-- Avoid an unnecessary frequent schedule to not get blocked by YouTube. For that reason * or wildcards for minutes are not supported.
+- Avoid an unnecessarily frequent schedule so you don't get blocked by YouTube. For that reason, the scheduler doesn't support schedules that trigger more than once per hour.
 
 ## Rescan Subscriptions
 That's the equivalent task as run from the downloads page looking through your channel and playlist and add missing videos to the download queue.
diff --git a/tubearchivist/home/templates/home/settings.html b/tubearchivist/home/templates/home/settings.html
index dd94879..049f79c 100644
--- a/tubearchivist/home/templates/home/settings.html
+++ b/tubearchivist/home/templates/home/settings.html
@@ -186,7 +186,7 @@
             <p>Note:</p>
             <ul>
                 <li>Changes in the scheduler settings require a container restart to take effect.</li>
-                <li>Avoid an unnecessary frequent schedule to not get blocked by YouTube. For that reason <i>*</i> or <i>wildcard</i> for minutes is not supported.</li>
+                <li>Avoid an unnecessarily frequent schedule so you don't get blocked by YouTube. For that reason, the scheduler doesn't support schedules that trigger more than once per hour.</li>
             </ul>
         </div>
     </div>

From e912cf7fb62941d87420dc47ccf96a312c70bba6 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Thu, 10 Nov 2022 09:53:49 +0700
Subject: [PATCH 02/17] rename to *common errors*, better issue template

---
 .github/ISSUE_TEMPLATE/BUG-REPORT.yml        | 4 +++-
 .github/ISSUE_TEMPLATE/INSTALLATION-HELP.yml | 2 +-
 README.md                                    | 4 ++--
 3 files changed, 6 insertions(+), 4 deletions(-)

diff --git a/.github/ISSUE_TEMPLATE/BUG-REPORT.yml b/.github/ISSUE_TEMPLATE/BUG-REPORT.yml
index dd0b723..b9f051a 100644
--- a/.github/ISSUE_TEMPLATE/BUG-REPORT.yml
+++ b/.github/ISSUE_TEMPLATE/BUG-REPORT.yml
@@ -11,10 +11,12 @@ body:
   - type: checkboxes
     id: latest
     attributes:
-      label: Latest and Greatest
+      label: I've read the documentation:
       options:
         - label: I'm running the latest version of Tube Archivist and have read the [release notes](https://github.com/tubearchivist/tubearchivist/releases/latest).
           required: true
+        - label: I have read through the [wiki](https://github.com/tubearchivist/tubearchivist/wiki) and the [readme](https://github.com/tubearchivist/tubearchivist#installing-and-updating), particularly the [common errors](https://github.com/tubearchivist/tubearchivist#common-errors) section.
+          required: true
 
   - type: input
     id: os
diff --git a/.github/ISSUE_TEMPLATE/INSTALLATION-HELP.yml b/.github/ISSUE_TEMPLATE/INSTALLATION-HELP.yml
index 8459327..07519dc 100644
--- a/.github/ISSUE_TEMPLATE/INSTALLATION-HELP.yml
+++ b/.github/ISSUE_TEMPLATE/INSTALLATION-HELP.yml
@@ -15,7 +15,7 @@ body:
       options:
         - label: I have read and understand the [installation instructions](https://github.com/tubearchivist/tubearchivist#installing-and-updating).
           required: true
-        - label: My issue is not described in the [potential pitfalls](https://github.com/tubearchivist/tubearchivist#potential-pitfalls) section.
+        - label: My issue is not described in the [common errors](https://github.com/tubearchivist/tubearchivist#common-errors) section.
           required: true
 
   - type: input
diff --git a/README.md b/README.md
index 4a406d7..bf029fd 100644
--- a/README.md
+++ b/README.md
@@ -16,7 +16,7 @@
 * [Extended Universe](#extended-universe)
 * [Installing and updating](#installing-and-updating)
 * [Getting Started](#getting-started)
-* [Potential pitfalls](#potential-pitfalls)
+* [Common Errors](#common-errors)
 * [Roadmap](#roadmap)
 * [Known limitations](#known-limitations)
 * [Donate](#donate)
@@ -165,7 +165,7 @@ You will see the current version number of **Tube Archivist** in the footer of t
 
 There is a Helm Chart available at https://github.com/insuusvenerati/helm-charts. Mostly self-explanatory but feel free to ask questions in the discord / subreddit.
 
-## Potential pitfalls
+## Common Errors
 ### vm.max_map_count
 **Elastic Search** in Docker requires the kernel setting of the host machine `vm.max_map_count` to be set to at least 262144.
 

From 5b7e3e877b37750a2d9dffe85ac22268b96ce4ee Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Sat, 12 Nov 2022 11:48:48 +0700
Subject: [PATCH 03/17] implement basic comment archive

---
 tubearchivist/home/src/es/index_mapping.json |  66 ++++++++++++
 tubearchivist/home/src/index/comments.py     | 101 +++++++++++++++++++
 2 files changed, 167 insertions(+)
 create mode 100644 tubearchivist/home/src/index/comments.py

diff --git a/tubearchivist/home/src/es/index_mapping.json b/tubearchivist/home/src/es/index_mapping.json
index f023eef..bed6973 100644
--- a/tubearchivist/home/src/es/index_mapping.json
+++ b/tubearchivist/home/src/es/index_mapping.json
@@ -460,6 +460,72 @@
                 },
                 "number_of_replicas": "0"
             }
+        },
+        {
+            "index_name": "comments",
+            "expected_map": {
+                "youtube_id": {
+                    "type": "keyword"
+                },
+                "comment_last_refresh": {
+                    "type": "date"
+                },
+                "comment_comments": {
+                    "properties": {
+                        "comment_id": {
+                            "type": "keyword"
+                        },
+                        "comment_text": {
+                            "type" : "text"
+                        },
+                        "comment_timestamp": {
+                            "type": "date"
+                        },
+                        "comment_time_text": {
+                            "type" : "text"
+                        },
+                        "comment_likecount": {
+                            "type": "long"
+                        },
+                        "comment_is_favorited": {
+                            "type": "boolean"
+                        },
+                        "comment_author": {
+                            "type": "text",
+                            "fields": {
+                                "keyword": {
+                                    "type": "keyword",
+                                    "ignore_above": 256,
+                                    "normalizer": "to_lower"
+                                }
+                            }
+                        },
+                        "comment_author_id": {
+                            "type": "keyword"
+                        },
+                        "comment_author_thumbnail": {
+                            "type": "keyword"
+                        },
+                        "comment_author_is_uploader": {
+                            "type": "boolean"
+                        },
+                        "comment_parent": {
+                            "type": "keyword"
+                        }
+                    }
+                }
+            },
+            "expected_set": {
+                "analysis": {
+                    "normalizer": {
+                        "to_lower": {
+                            "type": "custom",
+                            "filter": ["lowercase"]
+                        }
+                    }
+                },
+                "number_of_replicas": "0"
+            }
         }
     ]
 }
\ No newline at end of file
diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
new file mode 100644
index 0000000..05f9a6e
--- /dev/null
+++ b/tubearchivist/home/src/index/comments.py
@@ -0,0 +1,101 @@
+"""
+Functionality:
+- Download comments
+- Index comments in ES
+- Retrieve comments from ES
+"""
+
+from datetime import datetime
+
+from home.src.download.yt_dlp_base import YtWrap
+from home.src.es.connect import ElasticWrap
+
+
+class Comments:
+    """hold all comments functionality"""
+
+    def __init__(self, youtube_id):
+        self.youtube_id = youtube_id
+        self.es_path = f"ta_comments/_doc/{youtube_id}"
+        self.max_comments = "all,100,all,30"
+        self.json_data = False
+
+    def build_json(self):
+        """build json document for es"""
+        comments_raw = self.get_comments()
+        comments_format = self.format_comments(comments_raw)
+
+        self.json_data = {
+            "youtube_id": self.youtube_id,
+            "comment_last_refresh": int(datetime.now().strftime("%s")),
+            "comment_comments": comments_format,
+        }
+
+    def build_yt_obs(self):
+        """
+        get extractor config
+        max-comments,max-parents,max-replies,max-replies-per-thread
+        """
+        max_comments_list = [i.strip() for i in self.max_comments.split(",")]
+        comment_sort = "top"
+
+        yt_obs = {
+            "skip_download": True,
+            "quiet": False,
+            "getcomments": True,
+            "extractor_args": {
+                "youtube": {
+                    "max_comments": max_comments_list,
+                    "comment_sort": [comment_sort],
+                }
+            },
+        }
+
+        return yt_obs
+
+    def get_comments(self):
+        """get comments from youtube"""
+        print(f"comments: get comments with format {self.max_comments}")
+        yt_obs = self.build_yt_obs()
+        info_json = YtWrap(yt_obs).extract(self.youtube_id)
+        comments_raw = info_json.get("comments")
+        return comments_raw
+
+    def format_comments(self, comments_raw):
+        """process comments to match format"""
+        comments = []
+
+        for comment in comments_raw:
+            cleaned_comment = self.clean_comment(comment)
+            comments.append(cleaned_comment)
+
+        return comments
+
+    def clean_comment(self, comment):
+        """parse metadata from comment for indexing"""
+        time_text_datetime = datetime.utcfromtimestamp(comment["timestamp"])
+        time_text = time_text_datetime.strftime("%Y-%m-%d %H:%M:%S")
+
+        cleaned_comment = {
+            "comment_id": comment["id"],
+            "comment_text": comment["text"].replace("\xa0", ""),
+            "comment_timestamp": comment["timestamp"],
+            "comment_time_text": time_text,
+            "comment_likecount": comment["like_count"],
+            "comment_is_favorited": comment["is_favorited"],
+            "comment_author": comment["author"],
+            "comment_author_id": comment["author_id"],
+            "comment_author_thumbnail": comment["author_thumbnail"],
+            "comment_author_is_uploader": comment["author_is_uploader"],
+            "comment_parent": comment["parent"],
+        }
+
+        return cleaned_comment
+
+    def upload_comments(self):
+        """upload comments to es"""
+        _, _ = ElasticWrap(self.es_path).put(self.json_data)
+
+    def delete_comments(self):
+        """delete comments from es"""
+        _, _ = ElasticWrap(self.es_path).delete()

From f6b6185fb213bc055abf9fdd1f32e2f008c3a94a Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Sat, 12 Nov 2022 12:40:14 +0700
Subject: [PATCH 04/17] rename ta_comment index, implement get comments from es

---
 tubearchivist/home/src/es/index_mapping.json |  2 +-
 tubearchivist/home/src/index/comments.py     | 15 ++++++++++++---
 2 files changed, 13 insertions(+), 4 deletions(-)

diff --git a/tubearchivist/home/src/es/index_mapping.json b/tubearchivist/home/src/es/index_mapping.json
index bed6973..4a325ea 100644
--- a/tubearchivist/home/src/es/index_mapping.json
+++ b/tubearchivist/home/src/es/index_mapping.json
@@ -462,7 +462,7 @@
             }
         },
         {
-            "index_name": "comments",
+            "index_name": "comment",
             "expected_map": {
                 "youtube_id": {
                     "type": "keyword"
diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index 05f9a6e..a7423ee 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -16,13 +16,13 @@ class Comments:
 
     def __init__(self, youtube_id):
         self.youtube_id = youtube_id
-        self.es_path = f"ta_comments/_doc/{youtube_id}"
+        self.es_path = f"ta_comment/_doc/{youtube_id}"
         self.max_comments = "all,100,all,30"
         self.json_data = False
 
     def build_json(self):
         """build json document for es"""
-        comments_raw = self.get_comments()
+        comments_raw = self.get_yt_comments()
         comments_format = self.format_comments(comments_raw)
 
         self.json_data = {
@@ -53,7 +53,7 @@ class Comments:
 
         return yt_obs
 
-    def get_comments(self):
+    def get_yt_comments(self):
         """get comments from youtube"""
         print(f"comments: get comments with format {self.max_comments}")
         yt_obs = self.build_yt_obs()
@@ -99,3 +99,12 @@ class Comments:
     def delete_comments(self):
         """delete comments from es"""
         _, _ = ElasticWrap(self.es_path).delete()
+
+    def get_es_comments(self):
+        """get comments from ES"""
+        response, statuscode = ElasticWrap(self.es_path).get()
+        if statuscode == 404:
+            print(f"comments: not found {self.youtube_id}")
+            return False
+
+        return response

From fb046bed5bd1f897eddde5e4a4db2a5b2c59d6bd Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Sat, 12 Nov 2022 12:42:08 +0700
Subject: [PATCH 05/17] [API] implement get comments API view

---
 tubearchivist/api/README.md               |  4 ++++
 tubearchivist/api/src/search_processor.py | 16 ++++++++++++++++
 tubearchivist/api/urls.py                 |  6 ++++++
 tubearchivist/api/views.py                | 16 ++++++++++++++++
 4 files changed, 42 insertions(+)

diff --git a/tubearchivist/api/README.md b/tubearchivist/api/README.md
index 6e5efb4..593089d 100644
--- a/tubearchivist/api/README.md
+++ b/tubearchivist/api/README.md
@@ -12,6 +12,7 @@ Note:
 **Video**
 - [Video List](#video-list-view)
 - [Video Single](#video-item-view)
+- [Video Comments](#video-comment-view)
 - [Video Single Progress](#video-progress-view)
 - [Video Single Sponsorblock](#sponsor-block-view) WIP
 
@@ -78,6 +79,9 @@ Pass page number as a query parameter: `page=2`. Defaults to *0*, `page=1` is re
 ## Video Item View
 /api/video/\<video_id>/
 
+## Video Comment View
+/api/video/\<video_id>/comment/  
+
 ## Video Progress View
 /api/video/\<video_id>/progress  
 
diff --git a/tubearchivist/api/src/search_processor.py b/tubearchivist/api/src/search_processor.py
index 7a41163..7b594f6 100644
--- a/tubearchivist/api/src/search_processor.py
+++ b/tubearchivist/api/src/search_processor.py
@@ -48,6 +48,8 @@ class SearchProcess:
             processed = self._process_playlist(result["_source"])
         if index == "ta_download":
             processed = self._process_download(result["_source"])
+        if index == "ta_comment":
+            processed = self._process_comment(result["_source"])
 
         return processed
 
@@ -123,3 +125,17 @@ class SearchProcess:
             }
         )
         return dict(sorted(download_dict.items()))
+
+    def _process_comment(self, comment_dict):
+        """run on all comments, create reply thread"""
+        all_comments = comment_dict["comment_comments"]
+        processed_comments = []
+
+        for comment in all_comments:
+            if comment["comment_parent"] == "root":
+                comment.update({"comment_replies": []})
+                processed_comments.append(comment)
+            else:
+                processed_comments[-1]["comment_replies"].append(comment)
+
+        return processed_comments
diff --git a/tubearchivist/api/urls.py b/tubearchivist/api/urls.py
index e84ec05..7fb48a0 100644
--- a/tubearchivist/api/urls.py
+++ b/tubearchivist/api/urls.py
@@ -18,6 +18,7 @@ from api.views import (
     TaskApiView,
     VideoApiListView,
     VideoApiView,
+    VideoCommentView,
     VideoProgressView,
     VideoSponsorView,
 )
@@ -41,6 +42,11 @@ urlpatterns = [
         VideoProgressView.as_view(),
         name="api-video-progress",
     ),
+    path(
+        "video/<slug:video_id>/comment/",
+        VideoCommentView.as_view(),
+        name="api-video-comment",
+    ),
     path(
         "video/<slug:video_id>/sponsor/",
         VideoSponsorView.as_view(),
diff --git a/tubearchivist/api/views.py b/tubearchivist/api/views.py
index 2574db6..dab62e3 100644
--- a/tubearchivist/api/views.py
+++ b/tubearchivist/api/views.py
@@ -145,6 +145,22 @@ class VideoProgressView(ApiBaseView):
         return Response(self.response)
 
 
+class VideoCommentView(ApiBaseView):
+    """resolves to /api/video/<video_id>/comment/
+    handle video comments
+    GET: return all comments from video with reply threads
+    """
+
+    search_base = "ta_comment/_doc/"
+
+    def get(self, request, video_id):
+        """get video comments"""
+        # pylint: disable=unused-argument
+        self.get_document(video_id)
+
+        return Response(self.response, status=self.status_code)
+
+
 class VideoSponsorView(ApiBaseView):
     """resolves to /api/video/<video_id>/sponsor/
     handle sponsor block integration

From 79d134cea895c7a77d73c0a6a794c89a38e601c8 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Mon, 14 Nov 2022 11:59:59 +0700
Subject: [PATCH 06/17] clean format comments date string

---
 tubearchivist/home/src/index/comments.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index a7423ee..e06b973 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -74,7 +74,13 @@ class Comments:
     def clean_comment(self, comment):
         """parse metadata from comment for indexing"""
         time_text_datetime = datetime.utcfromtimestamp(comment["timestamp"])
-        time_text = time_text_datetime.strftime("%Y-%m-%d %H:%M:%S")
+
+        if time_text_datetime.hour == 0 and time_text_datetime.minute == 0:
+            format_string = "%Y-%m-%d"
+        else:
+            format_string = "%Y-%m-%d %H:%M"
+
+        time_text = time_text_datetime.strftime(format_string)
 
         cleaned_comment = {
             "comment_id": comment["id"],

From ad016df10504346b8733e7bc6c047d422a8c103d Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Mon, 14 Nov 2022 16:31:49 +0700
Subject: [PATCH 07/17] implement comment frontend

---
 tubearchivist/home/templates/home/video.html |  5 ++
 tubearchivist/static/css/style.css           | 37 +++++++++-
 tubearchivist/static/img/icon-heart.svg      |  8 ++
 tubearchivist/static/script.js               | 77 +++++++++++++++++++-
 4 files changed, 125 insertions(+), 2 deletions(-)
 create mode 100644 tubearchivist/static/img/icon-heart.svg

diff --git a/tubearchivist/home/templates/home/video.html b/tubearchivist/home/templates/home/video.html
index 705f6c6..df53a71 100644
--- a/tubearchivist/home/templates/home/video.html
+++ b/tubearchivist/home/templates/home/video.html
@@ -123,6 +123,11 @@
             </div>
         {% endfor %}
     {% endif %}
+    <div class="comments-section">
+        <h3>Comments</h3>
+        <div id="comments-list" class="comments-list">
+        </div>
+    </div>
 </div>
 <script>
     var videoData = getVideoData('{{ video.youtube_id }}');
diff --git a/tubearchivist/static/css/style.css b/tubearchivist/static/css/style.css
index f20d997..8907bfb 100644
--- a/tubearchivist/static/css/style.css
+++ b/tubearchivist/static/css/style.css
@@ -619,7 +619,8 @@ video:-webkit-full-screen {
     margin-top: 1rem;
 }
 
-.description-box {
+.description-box,
+.comments-section {
     margin-top: 1rem;
     padding: 15px;
     background-color: var(--highlight-bg);
@@ -778,6 +779,10 @@ video:-webkit-full-screen {
     margin-left: 5px;
 }
 
+.thumb-icon {
+    display: flex;
+}
+
 .thumb-icon img,
 .rating-stars img {
     width: 20px;
@@ -819,6 +824,36 @@ video:-webkit-full-screen {
     width: 100%;
 }
 
+.comment-box {
+    padding-bottom: 1rem;
+}
+
+.comments-replies {
+    padding-left: 3rem;
+}
+
+.comment-highlight {
+    background-color: var(--main-font);
+    padding: 3px;
+    color: var(--accent-font-dark);
+    font-family: Sen-bold, sans-serif;
+    width: fit-content;
+}
+
+.comment-meta {
+    display: flex;
+}
+
+.space-carrot {
+    margin: 0 10px;
+}
+
+.comment-like img {
+    width: 20px;
+    margin-left: 5px;
+    filter: var(--img-filter-error);
+}
+
 /* multi search page */
 .multi-search-box {
     padding-right: 20px;
diff --git a/tubearchivist/static/img/icon-heart.svg b/tubearchivist/static/img/icon-heart.svg
new file mode 100644
index 0000000..8a26e16
--- /dev/null
+++ b/tubearchivist/static/img/icon-heart.svg
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="utf-8"?>
+<!-- Generator: Adobe Illustrator 26.5.0, SVG Export Plug-In . SVG Version: 6.00 Build 0)  -->
+<svg version="1.1" id="Layer_1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" x="0px" y="0px"
+	 viewBox="0 0 500 500" style="enable-background:new 0 0 500 500;" xml:space="preserve">
+<path d="M499.9,159L499.9,159c0.1-1.7,0.1-3.4,0.1-5.2c0-69.5-58.6-129.7-130.9-129.7c-52.9,0-98.4,34-119,77.4h0
+	c-20.7-43.4-66.2-77.4-119-77.4C58.6,24.1,0,84.4,0,153.9c0,1.7,0.1,3.4,0.1,5.2h0c0,0-7.4,82.6,84.5,172.7
+	c41.8,41.9,88.5,81.6,165.4,144.1c76.9-62.5,123.6-102.3,165.4-144.1C507.2,241.6,499.9,159,499.9,159z"/>
+</svg>
diff --git a/tubearchivist/static/script.js b/tubearchivist/static/script.js
index 8a98092..47a28de 100644
--- a/tubearchivist/static/script.js
+++ b/tubearchivist/static/script.js
@@ -287,7 +287,7 @@ function resetToken() {
   document.getElementById('text-reveal').replaceWith(message);
 }
 
-// restore from snapshot 
+// restore from snapshot
 function restoreSnapshot(snapshotId) {
   console.log('restore ' + snapshotId);
   let apiEndpoint = '/api/snapshot/' + snapshotId + '/';
@@ -1104,6 +1104,81 @@ function createFulltext(fullText) {
   return fullTextDiv;
 }
 
+function getComments(videoId) {
+  let apiEndpoint = '/api/video/' + videoId + '/comment/';
+  let response = apiRequest(apiEndpoint, 'GET');
+  let allComments = response.data;
+
+  writeComments(allComments);
+}
+
+function writeComments(allComments) {
+  let commentsListBox = document.getElementById('comments-list');
+  for (let i = 0; i < allComments.length; i++) {
+    const rootComment = allComments[i];
+
+    let commentBox = createCommentBox(rootComment, true);
+
+    // add replies to commentBox
+    if (rootComment.comment_replies) {
+      let commentReplyBox = document.createElement('div');
+      commentReplyBox.setAttribute('class', 'comments-replies');
+      for (let j = 0; j < rootComment.comment_replies.length; j++) {
+        const commentReply = rootComment.comment_replies[j];
+        let commentReplyDiv = createCommentBox(commentReply, false);
+        commentReplyBox.appendChild(commentReplyDiv);
+      }
+      if (rootComment.comment_replies.length > 0) {
+        commentBox.appendChild(commentReplyBox);
+      }
+    }
+    commentsListBox.appendChild(commentBox);
+  }
+}
+
+function createCommentBox(comment, isRoot) {
+  // Build the DOM element for a single comment: author, text and meta row.
+  // isRoot is true for a top-level comment and false for a reply.
+  // Returns the assembled div.comment-box element.
+  let commentBox = document.createElement('div');
+  commentBox.setAttribute('class', 'comment-box');
+
+  // classList.add is a method and must be called; assigning to it would
+  // only overwrite the property and leave the class unset
+  commentBox.classList.add(isRoot ? 'root-comment' : 'reply-comment');
+
+  // author heading, highlighted when the author is the video uploader
+  let commentAuthor = document.createElement('h3');
+  commentAuthor.innerText = comment.comment_author;
+  if (comment.comment_author_is_uploader) {
+    commentAuthor.setAttribute('class', 'comment-highlight');
+  }
+  commentBox.appendChild(commentAuthor);
+
+  let commentText = document.createElement('p');
+  commentText.innerText = comment.comment_text;
+  commentBox.appendChild(commentText);
+
+  // meta row: time text, then like count and heart icon when present
+  const spacer = '<span class="space-carrot">|</span>';
+  let commentMeta = document.createElement('div');
+  commentMeta.setAttribute('class', 'comment-meta');
+
+  commentMeta.innerHTML = `<span>${comment.comment_time_text}</span>`;
+
+  if (comment.comment_likecount > 0) {
+    commentMeta.innerHTML += `${spacer}<span class="thumb-icon"><img src="/static/img/icon-thumb.svg"> ${comment.comment_likecount}</span>`;
+  }
+
+  if (comment.comment_is_favorited) {
+    commentMeta.innerHTML += `${spacer}<span class="comment-like"><img src="/static/img/icon-heart.svg"></span>`;
+  }
+
+  commentBox.appendChild(commentMeta);
+
+  return commentBox;
+}
+
 // generic
 
 function sendPost(payload) {

From 11c122cba30625b23f93aa7cf4bf3c57ed386905 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 08:58:25 +0700
Subject: [PATCH 08/17] finetune comments icon position

---
 tubearchivist/static/css/style.css | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/tubearchivist/static/css/style.css b/tubearchivist/static/css/style.css
index 8907bfb..6d5cc23 100644
--- a/tubearchivist/static/css/style.css
+++ b/tubearchivist/static/css/style.css
@@ -786,7 +786,7 @@ video:-webkit-full-screen {
 .thumb-icon img,
 .rating-stars img {
     width: 20px;
-    margin: 0;
+    margin: 0 5px;
     filter: var(--img-filter);
 }
 
@@ -830,6 +830,7 @@ video:-webkit-full-screen {
 
 .comments-replies {
     padding-left: 3rem;
+    margin-top: 1rem;
 }
 
 .comment-highlight {
@@ -845,7 +846,7 @@ video:-webkit-full-screen {
 }
 
 .space-carrot {
-    margin: 0 10px;
+    margin: 0 5px;
 }
 
 .comment-like img {

From 172ced7129e802a55f3fb23a9300873888e956b9 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 08:59:04 +0700
Subject: [PATCH 09/17] configure comments extraction

---
 tubearchivist/home/config.json                 |  2 ++
 tubearchivist/home/src/frontend/forms.py       | 10 ++++++++++
 tubearchivist/home/src/index/comments.py       | 18 +++++++++++++-----
 .../home/templates/home/settings.html          | 18 ++++++++++++++++++
 4 files changed, 43 insertions(+), 5 deletions(-)

diff --git a/tubearchivist/home/config.json b/tubearchivist/home/config.json
index a953a49..c8450d0 100644
--- a/tubearchivist/home/config.json
+++ b/tubearchivist/home/config.json
@@ -27,6 +27,8 @@
         "subtitle": false,
         "subtitle_source": false,
         "subtitle_index": false,
+        "comment_max": false,
+        "comment_sort": "top",
         "cookie_import": false,
         "throttledratelimit": false,
         "integrate_ryd": false,
diff --git a/tubearchivist/home/src/frontend/forms.py b/tubearchivist/home/src/frontend/forms.py
index 1e4365c..79cecbe 100644
--- a/tubearchivist/home/src/frontend/forms.py
+++ b/tubearchivist/home/src/frontend/forms.py
@@ -92,6 +92,12 @@ class ApplicationSettingsForm(forms.Form):
         ("1", "enable subtitle index"),
     ]
 
+    COMMENT_SORT_CHOICES = [
+        ("", "-- change comments sort settings --"),
+        ("top", "sort comments by top"),
+        ("new", "sort comments by new"),
+    ]
+
     COOKIE_IMPORT_CHOICES = [
         ("", "-- change cookie settings"),
         ("0", "disable cookie"),
@@ -120,6 +126,10 @@ class ApplicationSettingsForm(forms.Form):
     downloads_subtitle_index = forms.ChoiceField(
         widget=forms.Select, choices=SUBTITLE_INDEX_CHOICES, required=False
     )
+    downloads_comment_max = forms.CharField(required=False)
+    downloads_comment_sort = forms.ChoiceField(
+        widget=forms.Select, choices=COMMENT_SORT_CHOICES, required=False
+    )
     downloads_cookie_import = forms.ChoiceField(
         widget=forms.Select, choices=COOKIE_IMPORT_CHOICES, required=False
     )
diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index e06b973..c907cb5 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -9,19 +9,21 @@ from datetime import datetime
 
 from home.src.download.yt_dlp_base import YtWrap
 from home.src.es.connect import ElasticWrap
+from home.src.ta.config import AppConfig
 
 
 class Comments:
     """hold all comments functionality"""
 
-    def __init__(self, youtube_id):
+    def __init__(self, youtube_id, config=False):
         self.youtube_id = youtube_id
         self.es_path = f"ta_comment/_doc/{youtube_id}"
-        self.max_comments = "all,100,all,30"
         self.json_data = False
+        self.config = config
 
     def build_json(self):
         """build json document for es"""
+        self._check_config()
         comments_raw = self.get_yt_comments()
         comments_format = self.format_comments(comments_raw)
 
@@ -31,13 +33,19 @@ class Comments:
             "comment_comments": comments_format,
         }
 
+    def _check_config(self):
+        """read config if not attached"""
+        if not self.config:
+            self.config = AppConfig().config
+
     def build_yt_obs(self):
         """
         get extractor config
         max-comments,max-parents,max-replies,max-replies-per-thread
         """
-        max_comments_list = [i.strip() for i in self.max_comments.split(",")]
-        comment_sort = "top"
+        max_comments = self.config["downloads"]["comment_max"]
+        max_comments_list = [i.strip() for i in max_comments.split(",")]
+        comment_sort = self.config["downloads"]["comment_sort"]
 
         yt_obs = {
             "skip_download": True,
@@ -55,7 +63,7 @@ class Comments:
 
     def get_yt_comments(self):
         """get comments from youtube"""
-        print(f"comments: get comments with format {self.max_comments}")
+        print("comments: get comments")
         yt_obs = self.build_yt_obs()
         info_json = YtWrap(yt_obs).extract(self.youtube_id)
         comments_raw = info_json.get("comments")
diff --git a/tubearchivist/home/templates/home/settings.html b/tubearchivist/home/templates/home/settings.html
index 049f79c..b02e1bd 100644
--- a/tubearchivist/home/templates/home/settings.html
+++ b/tubearchivist/home/templates/home/settings.html
@@ -114,6 +114,24 @@
                 {{ app_form.downloads_subtitle_index }}
             </div>
         </div>
+        <div class="settings-group">
+            <h2 id="comments">Comments</h2>
+            <div class="settings-item">
+                <p>Download and index comments: <span class="settings-current">{{ config.downloads.comment_max }}</span><br>
+                <i>Follow the yt-dlp max_comments documentation, <a href="https://github.com/yt-dlp/yt-dlp#youtube" target="_blank">max-comments,max-parents,max-replies,max-replies-per-thread</a>:</i><br>
+                <p>Example configurations:</p>
+                <ul>
+                    <li><span class="settings-current">all,100,all,30</span>: Get 100 max-parents and 30 max-replies-per-thread.</li>
+                    <li><span class="settings-current">1000,all,all,50</span>: Get a total of 1000 comments over all, 50 replies per thread.</li>
+                </ul>
+                {{ app_form.downloads_comment_max }}</p>
+            </div>
+            <div class="settings-item">
+                <p>Selected comment sort method: <span class="settings-current">{{ config.downloads.comment_sort }}</span><br>
+                <i>Select the sort order used when fetching comments from YouTube:</i><br>
+                {{ app_form.downloads_comment_sort }}</p>
+            </div>
+        </div>
         <div class="settings-group">
             <h2 id="format">Cookie</h2>
             <div class="settings-item">

From 939cd7fb624812d343a4240d7ea8bb8ff90dd9de Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 09:22:58 +0700
Subject: [PATCH 10/17] index comments as a DownloadPostProcess

---
 tubearchivist/home/src/download/yt_dlp_handler.py | 14 ++++++++++++++
 tubearchivist/home/src/index/comments.py          |  2 +-
 2 files changed, 15 insertions(+), 1 deletion(-)

diff --git a/tubearchivist/home/src/download/yt_dlp_handler.py b/tubearchivist/home/src/download/yt_dlp_handler.py
index 4dcfe02..267b822 100644
--- a/tubearchivist/home/src/download/yt_dlp_handler.py
+++ b/tubearchivist/home/src/download/yt_dlp_handler.py
@@ -15,6 +15,7 @@ from home.src.download.subscriptions import PlaylistSubscription
 from home.src.download.yt_dlp_base import CookieHandler, YtWrap
 from home.src.es.connect import ElasticWrap, IndexPaginate
 from home.src.index.channel import YoutubeChannel
+from home.src.index.comments import Comments
 from home.src.index.playlist import YoutubePlaylist
 from home.src.index.video import YoutubeVideo, index_new_video
 from home.src.ta.config import AppConfig
@@ -39,6 +40,7 @@ class DownloadPostProcess:
         self.auto_delete_all()
         self.auto_delete_overwrites()
         self.validate_playlists()
+        self.get_comments()
 
     def auto_delete_all(self):
         """handle auto delete"""
@@ -139,6 +141,16 @@ class DownloadPostProcess:
 
         RedisArchivist().set_message(key, mess_dict, expire=expire)
 
+    def get_comments(self):
+        """index comments for all video ids collected by the downloader"""
+        if not self.download.config["downloads"]["comment_max"]:
+            return
+
+        for video_id in self.download.videos:
+            comment = Comments(video_id)
+            comment.build_json()
+            comment.upload_comments()
+
 
 class VideoDownloader:
     """
@@ -155,6 +167,7 @@ class VideoDownloader:
         self.config = AppConfig().config
         self._build_obs()
         self.channels = set()
+        self.videos = set()
 
     def run_queue(self):
         """setup download queue in redis loop until no more items"""
@@ -187,6 +200,7 @@ class VideoDownloader:
                 youtube_id, video_overwrites=self.video_overwrites
             )
             self.channels.add(vid_dict["channel"]["channel_id"])
+            self.videos.add(vid_dict["youtube_id"])
             mess_dict = {
                 "status": self.MSG,
                 "level": "info",
diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index c907cb5..fd5fb9c 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -23,6 +23,7 @@ class Comments:
 
     def build_json(self):
         """build json document for es"""
+        print(f"{self.youtube_id}: get comments")
         self._check_config()
         comments_raw = self.get_yt_comments()
         comments_format = self.format_comments(comments_raw)
@@ -63,7 +64,6 @@ class Comments:
 
     def get_yt_comments(self):
         """get comments from youtube"""
-        print("comments: get comments")
         yt_obs = self.build_yt_obs()
         info_json = YtWrap(yt_obs).extract(self.youtube_id)
         comments_raw = info_json.get("comments")

From 2818bd5d5224e0bdd1358de63c415966a299cc8b Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 09:44:20 +0700
Subject: [PATCH 11/17] add comments to video template if available

---
 tubearchivist/home/src/es/index_mapping.json |  3 +++
 tubearchivist/home/src/index/comments.py     | 15 ++++++++++++---
 tubearchivist/home/templates/home/video.html | 11 +++++++----
 3 files changed, 22 insertions(+), 7 deletions(-)

diff --git a/tubearchivist/home/src/es/index_mapping.json b/tubearchivist/home/src/es/index_mapping.json
index 4a325ea..79f1d81 100644
--- a/tubearchivist/home/src/es/index_mapping.json
+++ b/tubearchivist/home/src/es/index_mapping.json
@@ -193,6 +193,9 @@
                         }
                     }
                 },
+                "comment_count": {
+                    "type": "long"
+                },
                 "stats" : {
                     "properties" : {
                         "average_rating" : {
diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index fd5fb9c..b7694cf 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -20,18 +20,19 @@ class Comments:
         self.es_path = f"ta_comment/_doc/{youtube_id}"
         self.json_data = False
         self.config = config
+        self.comments_format = False
 
     def build_json(self):
         """build json document for es"""
         print(f"{self.youtube_id}: get comments")
         self._check_config()
         comments_raw = self.get_yt_comments()
-        comments_format = self.format_comments(comments_raw)
+        self.format_comments(comments_raw)
 
         self.json_data = {
             "youtube_id": self.youtube_id,
             "comment_last_refresh": int(datetime.now().strftime("%s")),
-            "comment_comments": comments_format,
+            "comment_comments": self.comments_format,
         }
 
     def _check_config(self):
@@ -77,7 +78,7 @@ class Comments:
             cleaned_comment = self.clean_comment(comment)
             comments.append(cleaned_comment)
 
-        return comments
+        self.comments_format = comments
 
     def clean_comment(self, comment):
         """parse metadata from comment for indexing"""
@@ -110,6 +111,14 @@ class Comments:
         """upload comments to es"""
         _, _ = ElasticWrap(self.es_path).put(self.json_data)
 
+        vid_path = f"ta_video/_update/{self.youtube_id}"
+        data = {
+            "doc": {
+                "comment_count": len(self.comments_format)
+            }
+        }
+        _, _ = ElasticWrap(vid_path).post(data=data)
+
     def delete_comments(self):
         """delete comments from es"""
         _, _ = ElasticWrap(self.es_path).delete()
diff --git a/tubearchivist/home/templates/home/video.html b/tubearchivist/home/templates/home/video.html
index df53a71..a5fc044 100644
--- a/tubearchivist/home/templates/home/video.html
+++ b/tubearchivist/home/templates/home/video.html
@@ -123,11 +123,14 @@
             </div>
         {% endfor %}
     {% endif %}
-    <div class="comments-section">
-        <h3>Comments</h3>
-        <div id="comments-list" class="comments-list">
+    {% if video.comment_count %}
+        <div class="comments-section">
+            <h3>Comments: {{video.comment_count}}</h3>
+            <div id="comments-list" class="comments-list">
+            </div>
         </div>
-    </div>
+        <script>getComments('{{ video.youtube_id }}')</script>
+    {% endif %}
 </div>
 <script>
     var videoData = getVideoData('{{ video.youtube_id }}');

From 31c967cc11ad974a97d8323868993489a6987f63 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 09:46:33 +0700
Subject: [PATCH 12/17] fix linter

---
 tubearchivist/home/src/index/comments.py | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index b7694cf..b92e609 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -112,11 +112,7 @@ class Comments:
         _, _ = ElasticWrap(self.es_path).put(self.json_data)
 
         vid_path = f"ta_video/_update/{self.youtube_id}"
-        data = {
-            "doc": {
-                "comment_count": len(self.comments_format)
-            }
-        }
+        data = {"doc": {"comment_count": len(self.comments_format)}}
         _, _ = ElasticWrap(vid_path).post(data=data)
 
     def delete_comments(self):

From b5ceb264ecc7f3b140d2214f4beaaa3075dfffdd Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 09:51:18 +0700
Subject: [PATCH 13/17] format comment like number

---
 tubearchivist/static/script.js | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/tubearchivist/static/script.js b/tubearchivist/static/script.js
index 47a28de..7e760bf 100644
--- a/tubearchivist/static/script.js
+++ b/tubearchivist/static/script.js
@@ -1167,7 +1167,8 @@ function createCommentBox(comment, isRoot) {
   commentMeta.innerHTML = `<span>${comment.comment_time_text}</span>`;
 
   if (comment.comment_likecount > 0) {
-    commentMeta.innerHTML += `${spacer}<span class="thumb-icon"><img src="/static/img/icon-thumb.svg"> ${comment.comment_likecount}</span>`;
+    let numberFormatted = formatNumbers(comment.comment_likecount)
+    commentMeta.innerHTML += `${spacer}<span class="thumb-icon"><img src="/static/img/icon-thumb.svg"> ${numberFormatted}</span>`;
   }
 
   if (comment.comment_is_favorited) {

From a5be5a719b0e9198878d652d05003a9f862da2b1 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 10:31:09 +0700
Subject: [PATCH 14/17] reindex comments

---
 .../home/src/download/yt_dlp_handler.py       |  2 +-
 tubearchivist/home/src/index/comments.py      | 29 +++++++++++++++++--
 tubearchivist/home/src/index/reindex.py       |  6 ++--
 3 files changed, 32 insertions(+), 5 deletions(-)

diff --git a/tubearchivist/home/src/download/yt_dlp_handler.py b/tubearchivist/home/src/download/yt_dlp_handler.py
index 267b822..61a8c2f 100644
--- a/tubearchivist/home/src/download/yt_dlp_handler.py
+++ b/tubearchivist/home/src/download/yt_dlp_handler.py
@@ -147,7 +147,7 @@ class DownloadPostProcess:
             return
 
         for video_id in self.download.videos:
-            comment = Comments(video_id)
+            comment = Comments(video_id, config=self.download.config)
             comment.build_json()
             comment.upload_comments()
 
diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index b92e609..b98a691 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -20,12 +20,17 @@ class Comments:
         self.es_path = f"ta_comment/_doc/{youtube_id}"
         self.json_data = False
         self.config = config
+        self.is_activated = False
         self.comments_format = False
 
     def build_json(self):
         """build json document for es"""
         print(f"{self.youtube_id}: get comments")
         self._check_config()
+
+        if not self.is_activated:
+            return
+
         comments_raw = self.get_yt_comments()
         self.format_comments(comments_raw)
 
@@ -40,6 +45,8 @@ class Comments:
         if not self.config:
             self.config = AppConfig().config
 
+        self.is_activated = bool(self.config["downloads"]["comment_max"])
+
     def build_yt_obs(self):
         """
         get extractor config
@@ -109,6 +116,9 @@ class Comments:
 
     def upload_comments(self):
         """upload comments to es"""
+        if not self.is_activated:
+            return
+
         _, _ = ElasticWrap(self.es_path).put(self.json_data)
 
         vid_path = f"ta_video/_update/{self.youtube_id}"
@@ -117,7 +127,7 @@ class Comments:
 
     def delete_comments(self):
         """delete comments from es"""
-        _, _ = ElasticWrap(self.es_path).delete()
+        _, _ = ElasticWrap(self.es_path).delete(refresh=True)
 
     def get_es_comments(self):
         """get comments from ES"""
@@ -126,4 +136,19 @@ class Comments:
             print(f"comments: not found {self.youtube_id}")
             return False
 
-        return response
+        return response.get("_source")
+
+    def reindex_comments(self):
+        """update comments from youtube"""
+        if not self.is_activated:
+            return
+
+        self.build_json()
+        # get_es_comments returns False when nothing is indexed yet
+        es_comments = self.get_es_comments() or {}
+        if not self.comments_format and es_comments.get("comment_comments"):
+            # youtube returned nothing: keep the comments already in es
+            return
+
+        self.delete_comments()
+        self.upload_comments()
diff --git a/tubearchivist/home/src/index/reindex.py b/tubearchivist/home/src/index/reindex.py
index ac0c363..b8b89f0 100644
--- a/tubearchivist/home/src/index/reindex.py
+++ b/tubearchivist/home/src/index/reindex.py
@@ -16,6 +16,7 @@ from home.src.download.yt_dlp_base import CookieHandler
 from home.src.download.yt_dlp_handler import VideoDownloader
 from home.src.es.connect import ElasticWrap
 from home.src.index.channel import YoutubeChannel
+from home.src.index.comments import Comments
 from home.src.index.playlist import YoutubePlaylist
 from home.src.index.video import YoutubeVideo
 from home.src.ta.config import AppConfig
@@ -147,8 +148,7 @@ class Reindex:
         if integrate_ryd:
             self._get_unrated_vids()
 
-    @staticmethod
-    def _reindex_single_video(youtube_id):
+    def _reindex_single_video(self, youtube_id):
         """refresh data for single video"""
         video = YoutubeVideo(youtube_id)
 
@@ -182,6 +182,8 @@ class Reindex:
         thumb_handler.delete_video_thumb()
         thumb_handler.download_video_thumb(video.json_data["vid_thumb_url"])
 
+        Comments(youtube_id, config=self.config).reindex_comments()
+
         return
 
     @staticmethod

From e590d456a157b3f34217e922a3f25c154e4117ce Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 10:47:48 +0700
Subject: [PATCH 15/17] delete comments when deleting video

---
 tubearchivist/home/src/index/comments.py | 5 +++--
 tubearchivist/home/src/index/video.py    | 9 +++++++++
 2 files changed, 12 insertions(+), 2 deletions(-)

diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index b98a691..3ad7c9e 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -26,7 +26,7 @@ class Comments:
     def build_json(self):
         """build json document for es"""
         print(f"{self.youtube_id}: get comments")
-        self._check_config()
+        self.check_config()
 
         if not self.is_activated:
             return
@@ -40,7 +40,7 @@ class Comments:
             "comment_comments": self.comments_format,
         }
 
-    def _check_config(self):
+    def check_config(self):
         """read config if not attached"""
         if not self.config:
             self.config = AppConfig().config
@@ -127,6 +127,7 @@ class Comments:
 
     def delete_comments(self):
         """delete comments from es"""
+        print(f"{self.youtube_id}: delete comments")
         _, _ = ElasticWrap(self.es_path).delete(refresh=True)
 
     def get_es_comments(self):
diff --git a/tubearchivist/home/src/index/video.py b/tubearchivist/home/src/index/video.py
index 9264080..7780c63 100644
--- a/tubearchivist/home/src/index/video.py
+++ b/tubearchivist/home/src/index/video.py
@@ -11,6 +11,7 @@ import requests
 from django.conf import settings
 from home.src.es.connect import ElasticWrap
 from home.src.index import channel as ta_channel
+from home.src.index import comments as ta_comments
 from home.src.index import playlist as ta_playlist
 from home.src.index.generic import YouTubeItem
 from home.src.index.subtitle import YoutubeSubtitle
@@ -302,6 +303,7 @@ class YoutubeVideo(YouTubeItem, YoutubeSubtitle):
         self.del_in_playlists()
         self.del_in_es()
         self.delete_subtitles()
+        self.delete_comments()
 
     def del_in_playlists(self):
         """remove downloaded in playlist"""
@@ -326,6 +328,13 @@ class YoutubeVideo(YouTubeItem, YoutubeSubtitle):
         print(f"{self.youtube_id}: delete subtitles")
         YoutubeSubtitle(self).delete(subtitles=subtitles)
 
+    def delete_comments(self):
+        """remove this video's comment document from es if comments are on"""
+        handler = ta_comments.Comments(self.youtube_id, config=self.config)
+        handler.check_config()
+        if handler.is_activated:
+            handler.delete_comments()
+
     def _get_ryd_stats(self):
         """get optional stats from returnyoutubedislikeapi.com"""
         # pylint: disable=broad-except

From 8f5311ff04f37ae0ae4701854fbda46ee2e0fa70 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 11:33:06 +0700
Subject: [PATCH 16/17] delete comments when deleting channel

---
 tubearchivist/home/src/es/index_mapping.json |  3 +++
 tubearchivist/home/src/index/channel.py      | 12 +++++++++++-
 tubearchivist/home/src/index/comments.py     |  7 +++++--
 3 files changed, 19 insertions(+), 3 deletions(-)

diff --git a/tubearchivist/home/src/es/index_mapping.json b/tubearchivist/home/src/es/index_mapping.json
index 79f1d81..7270563 100644
--- a/tubearchivist/home/src/es/index_mapping.json
+++ b/tubearchivist/home/src/es/index_mapping.json
@@ -473,6 +473,9 @@
                 "comment_last_refresh": {
                     "type": "date"
                 },
+                "comment_channel_id": {
+                    "type": "keyword"
+                },
                 "comment_comments": {
                     "properties": {
                         "comment_id": {
diff --git a/tubearchivist/home/src/index/channel.py b/tubearchivist/home/src/index/channel.py
index 7a554a9..7108d43 100644
--- a/tubearchivist/home/src/index/channel.py
+++ b/tubearchivist/home/src/index/channel.py
@@ -50,7 +50,7 @@ class ChannelScraper:
         url = f"https://www.youtube.com/channel/{self.channel_id}/about?hl=en"
         cookies = {"CONSENT": "YES+xxxxxxxxxxxxxxxxxxxxxxxxxxx"}
         response = requests.get(
-            url, cookies=cookies, headers=requests_headers()
+            url, cookies=cookies, headers=requests_headers(), timeout=10
         )
         if response.ok:
             channel_page = response.text
@@ -275,6 +275,15 @@ class YoutubeChannel(YouTubeItem):
         }
         _, _ = ElasticWrap("ta_video/_delete_by_query").post(data)
 
+    def delete_es_comments(self):
+        """purge every ta_comment document indexed for this channel"""
+        # comment docs carry the owning channel in comment_channel_id,
+        # so a single term query matches everything to remove
+        channel_term = {"comment_channel_id": {"value": self.youtube_id}}
+        query = {"query": {"term": channel_term}}
+        path = "ta_comment/_delete_by_query"
+        _, _ = ElasticWrap(path).post(query)
+
     def delete_playlists(self):
         """delete all indexed playlist from es"""
         all_playlists = self.get_indexed_playlists()
@@ -301,6 +310,7 @@ class YoutubeChannel(YouTubeItem):
         self.delete_playlists()
         print(f"{self.youtube_id}: delete indexed videos")
         self.delete_es_videos()
+        self.delete_es_comments()
         self.del_in_es()
 
     def index_channel_playlists(self):
diff --git a/tubearchivist/home/src/index/comments.py b/tubearchivist/home/src/index/comments.py
index 3ad7c9e..0ac2436 100644
--- a/tubearchivist/home/src/index/comments.py
+++ b/tubearchivist/home/src/index/comments.py
@@ -31,12 +31,13 @@ class Comments:
         if not self.is_activated:
             return
 
-        comments_raw = self.get_yt_comments()
+        comments_raw, channel_id = self.get_yt_comments()
         self.format_comments(comments_raw)
 
         self.json_data = {
             "youtube_id": self.youtube_id,
             "comment_last_refresh": int(datetime.now().strftime("%s")),
+            "comment_channel_id": channel_id,
             "comment_comments": self.comments_format,
         }
 
@@ -75,7 +76,8 @@ class Comments:
         yt_obs = self.build_yt_obs()
         info_json = YtWrap(yt_obs).extract(self.youtube_id)
         comments_raw = info_json.get("comments")
-        return comments_raw
+        channel_id = info_json.get("channel_id")
+        return comments_raw, channel_id
 
     def format_comments(self, comments_raw):
         """process comments to match format"""
@@ -141,6 +143,7 @@ class Comments:
 
     def reindex_comments(self):
         """update comments from youtube"""
+        self.check_config()
         if not self.is_activated:
             return
 

From cc965ac473124b2ecab494de6718de1e6505dda1 Mon Sep 17 00:00:00 2001
From: simon <simobilleter@gmail.com>
Date: Fri, 18 Nov 2022 11:35:09 +0700
Subject: [PATCH 17/17] update TA_VERSION to unstable

---
 tubearchivist/config/settings.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tubearchivist/config/settings.py b/tubearchivist/config/settings.py
index 5721e98..1f350f0 100644
--- a/tubearchivist/config/settings.py
+++ b/tubearchivist/config/settings.py
@@ -262,4 +262,4 @@ CORS_ALLOW_HEADERS = list(default_headers) + [
 
 # TA application settings
 TA_UPSTREAM = "https://github.com/tubearchivist/tubearchivist"
-TA_VERSION = "v0.2.4"
+TA_VERSION = "v0.2.5-unstable"