saurabhshri · MatejMecka · Jan 2, 2018 · Jan 2, 2018 · Jan 2, 2018 · Jan 2, 2018
diff --git a/srtparser.h b/srtparser.h
@@ -92,7 +92,6 @@ class SubtitleItem
     std::vector<std::string> getNonDialogueWords(); //return string vector of non dialogue words
     std::vector<std::string> getStyleTags();    //return string vector of style tags
 
-
     void setStartTime(long int startTime);  //set starting time
     void setEndTime(long int endTime);      //set ending time
     void setText(std::string text);         //set subtitle text
@@ -382,17 +381,12 @@ inline void SubtitleItem::extractInfo(bool keepHTML, bool doNotIgnoreNonDialogue
     //stripping HTML tags
     if(!keepHTML)
     {
-        /*
-         * TODO : Before erasing, extract the words.
-         * std::vector<std::string> getStyleTags();
-         * int getStyleTagCount() const;
-         * std::vector<std::string> _styleTag;
-         * int _styleTagCount;
-         */
 
         int countP = 0;
+        std::string tag;
         for(char& c : output) // replacing <...> with ~~~~
         {
+
             if(c=='<')
             {
                 countP++;
@@ -403,34 +397,37 @@ inline void SubtitleItem::extractInfo(bool keepHTML, bool doNotIgnoreNonDialogue
             {
                 if(countP!=0)
                 {
-                    if(c != '>')
-                        c = '~';
-
+                    if(c != '>'){ // still inside <...>: collect the tag text, then mask the char
+                            tag += c;
+                            c = '~';
+                    }
                     else if(c == '>')
                     {
                         c = '~';
                         countP--;
+                        _styleTagCount++;
+                        if(tag[0] == '/'){ // closing tag such as </i>: drop the leading '/'
+                            tag.erase(0,1);
+                        }
+                        _styleTag.push_back(tag); // style tags go in _styleTag, not _nonDialogue
+                        tag="";
                     }
                 }
             }
+
         }
+
     }
 
     //stripping non dialogue data e.g. (applause)
 
     if(!doNotIgnoreNonDialogues)
     {
-        /*
-         * TODO : Before erasing, extract the words.
-         * std::vector<std::string> getNonDialogueWords();
-         * int getNonDialogueCount() const;
-         * std::vector<std::string> _nonDialogue;
-         * int _nonDialogueCount;
-         */
-
         int countP = 0;
+        std::string tag;
         for(char& c : output)   // replacing (...) with ~~~~
         {
+
             if(c=='(')
             {
                 countP++;
@@ -441,13 +438,17 @@ inline void SubtitleItem::extractInfo(bool keepHTML, bool doNotIgnoreNonDialogue
             {
                 if(countP!=0)
                 {
-                    if(c != ')')
+                    if(c != ')'){
+                        tag.push_back(c);
                         c = '~';
-
+                    }
                     else if(c == ')')
                     {
                         c = '~';
                         countP--;
+                        _nonDialogueCount++;
+                        _nonDialogue.push_back(tag);
+                        tag="";
                     }
                 }
             }
@@ -654,4 +655,4 @@ inline SubtitleWord::~SubtitleWord(void)
 }
 
 
-#endif //SRTPARSER_H
+#endif //SRTPARSER_H