From 5df09e7372716101364ddde636386cc32aeb295a Mon Sep 17 00:00:00 2001
From: Michael Vettese <michael.vettese@americanwell.com>
Date: Fri, 10 Jan 2025 11:20:31 -0500
Subject: [PATCH 1/4] Removes deprecated cgi function and replaces with
 email.message.Message

---
 docs/urls.html | 62 +++++++++++++++++++++-----------------------------
 1 file changed, 26 insertions(+), 36 deletions(-)
diff --git a/docs/urls.html b/docs/urls.html
index 8267ca2..72aae7a 100644
--- a/docs/urls.html
+++ b/docs/urls.html
@@ -37,8 +37,8 @@ <h1 class="title">Module <code>pywebcopy.urls</code></h1>
 
 import os
 import re
-from cgi import parse_header
 from collections import namedtuple
+from email.message import Message
 from hashlib import md5
 from zlib import adler32
 
@@ -53,7 +53,7 @@ <h1 class="title">Module <code>pywebcopy.urls</code></h1>
 
 __all__ = [
     &#39;url2path&#39;, &#39;filename_present&#39;, &#39;relate&#39;, &#39;get_etag&#39;, &#39;HIERARCHY&#39;, &#39;LINEAR&#39;,
-    &#39;parse_url&#39;, &#39;parse_header&#39;, &#39;get_host&#39;, &#39;get_prefix&#39;, &#39;get_suffix&#39;,
+    &#39;parse_url&#39;, &#39;Message&#39;, &#39;get_host&#39;, &#39;get_prefix&#39;, &#39;get_suffix&#39;,
     &#39;Url&#39;, &#39;LocationParseError&#39;, &#39;secure_filename&#39;, &#39;split_first&#39;,
     &#39;common_prefix_map&#39;, &#39;common_suffix_map&#39;, &#39;get_content_type_from_headers&#39;,
     &#39;Context&#39;, &#39;ContextError&#39;,
@@ -296,11 +296,17 @@ <h1 class="title">Module <code>pywebcopy.urls</code></h1>
     return md5(string).hexdigest()
 
 
+def parse_separated_header(value: str):
+    m = Message()
+    m[&#39;content-type&#39;] = value
+    return dict(m.get_params())
+
+
 def get_content_type_from_headers(headers, default=None):
     content_type = headers.get(&#39;Content-Type&#39;, default)
     if not content_type:
         return default
-    content_type, params = parse_header(content_type)
+    content_type, params = parse_separated_header(content_type)
     return content_type
 
 
@@ -769,6 +775,21 @@ <h2 class="section-title" id="header-functions">Functions</h2>
     return bool(_filter_and_group_segments(url, remove_query=True, remove_frag=True)[1])</code></pre>
 </details>
 </dd>
+<dt id="pywebcopy.urls.parse_separated_header"><code class="name flex">
+    <span>def <span class="ident">parse_separated_header</span></span>(<span>value: str)</span>
+    </code></dt>
+    <dd>
+    <div class="desc"></div>
+    <details class="source">
+    <summary>
+    <span>Expand source code</span>
+    </summary>
+    <pre><code class="python">def parse_separated_header(value: str):
+        m = Message()
+        m[&#39;content-type&#39;] = value
+        return dict(m.get_params())</code></pre>
+    </details>
+    </dd>
 <dt id="pywebcopy.urls.get_content_type_from_headers"><code class="name flex">
 <span>def <span class="ident">get_content_type_from_headers</span></span>(<span>headers, default=None)</span>
 </code></dt>
@@ -782,7 +803,7 @@ <h2 class="section-title" id="header-functions">Functions</h2>
     content_type = headers.get(&#39;Content-Type&#39;, default)
     if not content_type:
         return default
-    content_type, params = parse_header(content_type)
+    content_type, params = parse_separated_header(content_type)
     return content_type</code></pre>
 </details>
 </dd>
@@ -844,37 +865,6 @@ <h2 class="section-title" id="header-functions">Functions</h2>
     return common_suffix_map.get(content_type)</code></pre>
 </details>
 </dd>
-<dt id="pywebcopy.urls.parse_header"><code class="name flex">
-<span>def <span class="ident">parse_header</span></span>(<span>line)</span>
-</code></dt>
-<dd>
-<div class="desc"><p>Parse a Content-type like header.</p>
-<p>Return the main content-type and a dictionary of options.</p></div>
-<details class="source">
-<summary>
-<span>Expand source code</span>
-</summary>
-<pre><code class="python">def parse_header(line):
-    &#34;&#34;&#34;Parse a Content-type like header.
-
-    Return the main content-type and a dictionary of options.
-
-    &#34;&#34;&#34;
-    parts = _parseparam(&#39;;&#39; + line)
-    key = parts.__next__()
-    pdict = {}
-    for p in parts:
-        i = p.find(&#39;=&#39;)
-        if i &gt;= 0:
-            name = p[:i].strip().lower()
-            value = p[i+1:].strip()
-            if len(value) &gt;= 2 and value[0] == value[-1] == &#39;&#34;&#39;:
-                value = value[1:-1]
-                value = value.replace(&#39;\\\\&#39;, &#39;\\&#39;).replace(&#39;\\&#34;&#39;, &#39;&#34;&#39;)
-            pdict[name] = value
-    return key, pdict</code></pre>
-</details>
-</dd>
 <dt id="pywebcopy.urls.parse_url"><code class="name flex">
 <span>def <span class="ident">parse_url</span></span>(<span>url)</span>
 </code></dt>
@@ -1649,7 +1639,7 @@ <h1>Index</h1>
 <li><code><a title="pywebcopy.urls.get_host" href="#pywebcopy.urls.get_host">get_host</a></code></li>
 <li><code><a title="pywebcopy.urls.get_prefix" href="#pywebcopy.urls.get_prefix">get_prefix</a></code></li>
 <li><code><a title="pywebcopy.urls.get_suffix" href="#pywebcopy.urls.get_suffix">get_suffix</a></code></li>
-<li><code><a title="pywebcopy.urls.parse_header" href="#pywebcopy.urls.parse_header">parse_header</a></code></li>
+<li><code><a title="pywebcopy.urls.parse_separated_header" href="#pywebcopy.urls.parse_separated_header">parse_separated_header</a></code></li>
 <li><code><a title="pywebcopy.urls.parse_url" href="#pywebcopy.urls.parse_url">parse_url</a></code></li>
 <li><code><a title="pywebcopy.urls.relate" href="#pywebcopy.urls.relate">relate</a></code></li>
 <li><code><a title="pywebcopy.urls.secure_filename" href="#pywebcopy.urls.secure_filename">secure_filename</a></code></li>

From ca23196616a2fd44bbefdb44be2ad426b45460c4 Mon Sep 17 00:00:00 2001
From: Michael Vettese <michael.vettese@americanwell.com>
Date: Wed, 15 Jan 2025 10:38:01 -0500
Subject: [PATCH 2/4] Replaces cgi.parse_header in pywebcopy/urls.py

---
 pywebcopy/urls.py | 13 ++++++++++---
 1 file changed, 10 insertions(+), 3 deletions(-)

diff --git a/pywebcopy/urls.py b/pywebcopy/urls.py
index 18480cc..be837fe 100644
--- a/pywebcopy/urls.py
+++ b/pywebcopy/urls.py
@@ -9,8 +9,8 @@
 
 import os
 import re
-from cgi import parse_header
 from collections import namedtuple
+from email.message import Message
 from hashlib import md5
 from zlib import adler32
 
@@ -25,7 +25,7 @@
 
 __all__ = [
     'url2path', 'filename_present', 'relate', 'get_etag', 'HIERARCHY', 'LINEAR',
-    'parse_url', 'parse_header', 'get_host', 'get_prefix', 'get_suffix',
+    'parse_url', 'parse_separated_header', 'get_host', 'get_prefix', 'get_suffix',
     'Url', 'LocationParseError', 'secure_filename', 'split_first',
     'common_prefix_map', 'common_suffix_map', 'get_content_type_from_headers',
     'Context', 'ContextError',
@@ -272,11 +272,18 @@ def get_etag(string):
     return md5(string).hexdigest()
 
 
+def parse_separated_header(value: str):
+    # Adapted from https://peps.python.org/pep-0594/#cgi
+    m = Message()
+    m['content-type'] = value
+    return dict(m.get_params())
+
+
 def get_content_type_from_headers(headers, default=None):
     content_type = headers.get('Content-Type', default)
     if not content_type:
         return default
-    content_type, params = parse_header(content_type)
+    content_type, _params = parse_separated_header(content_type)
     return content_type
 
 

From a1c5cffae833db73e0ba493cd0fe48e2038e6a08 Mon Sep 17 00:00:00 2001
From: Michael Vettese <michael.vettese@americanwell.com>
Date: Tue, 28 Jan 2025 14:12:51 -0500
Subject: [PATCH 3/4] Update parse_separated_header function

---
 docs/urls.html    |  7 ++++---
 pywebcopy/urls.py | 10 +++++-----
 2 files changed, 9 insertions(+), 8 deletions(-)

diff --git a/docs/urls.html b/docs/urls.html
index 72aae7a..b16cbe8 100644
--- a/docs/urls.html
+++ b/docs/urls.html
@@ -785,9 +785,10 @@ <h2 class="section-title" id="header-functions">Functions</h2>
     <span>Expand source code</span>
     </summary>
     <pre><code class="python">def parse_separated_header(value: str):
-        m = Message()
-        m[&#39;content-type&#39;] = value
-        return dict(m.get_params())</code></pre>
+        msg = EmailMessage()
+        msg[&#39;content-type&#39;] = &#39;application/json; charset=&#34;utf8&#34;&#39;
+        main, params = msg.get_content_type(), msg[&#39;content-type&#39;].params
+        return main, params</code></pre>
     </details>
     </dd>
 <dt id="pywebcopy.urls.get_content_type_from_headers"><code class="name flex">
diff --git a/pywebcopy/urls.py b/pywebcopy/urls.py
index be837fe..a8ab7f0 100644
--- a/pywebcopy/urls.py
+++ b/pywebcopy/urls.py
@@ -10,7 +10,7 @@
 import os
 import re
 from collections import namedtuple
-from email.message import Message
+from email.message import EmailMessage
 from hashlib import md5
 from zlib import adler32
 
@@ -273,10 +273,10 @@ def get_etag(string):
 
 
 def parse_separated_header(value: str):
-    # Adapted from https://peps.python.org/pep-0594/#cgi
-    m = Message()
-    m['content-type'] = value
-    return dict(m.get_params())
+    msg = EmailMessage()
+    msg['content-type'] = value  # parse the caller's header, not the PEP 594 sample
+    main, params = msg.get_content_type(), dict(msg['content-type'].params)
+    return main, params
 
 
 def get_content_type_from_headers(headers, default=None):

From a9ba09f48b0f8cd24e9748b6486ea409eec926f1 Mon Sep 17 00:00:00 2001
From: Michael Vettese <michael.vettese@americanwell.com>
Date: Fri, 7 Feb 2025 11:21:34 -0500
Subject: [PATCH 4/4] Updates docs

---
 docs/urls.html | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/docs/urls.html b/docs/urls.html
index b16cbe8..c23753b 100644
--- a/docs/urls.html
+++ b/docs/urls.html
@@ -297,16 +297,17 @@ <h1 class="title">Module <code>pywebcopy.urls</code></h1>
 
 
 def parse_separated_header(value: str):
-    m = Message()
-    m[&#39;content-type&#39;] = value
-    return dict(m.get_params())
+    msg = EmailMessage()
+    msg['content-type'] = 'application/json; charset="utf8"'
+    main, params = msg.get_content_type(), msg['content-type'].params
+    return main, params
 
 
 def get_content_type_from_headers(headers, default=None):
     content_type = headers.get(&#39;Content-Type&#39;, default)
     if not content_type:
         return default
-    content_type, params = parse_separated_header(content_type)
+    content_type = parse_separated_header(content_type)
     return content_type
 
 
@@ -804,7 +805,7 @@ <h2 class="section-title" id="header-functions">Functions</h2>
     content_type = headers.get(&#39;Content-Type&#39;, default)
     if not content_type:
         return default
-    content_type, params = parse_separated_header(content_type)
+    content_type = parse_separated_header(content_type)
     return content_type</code></pre>
 </details>
 </dd>