
Commit 51991d0

Merge pull request #23 from tomas-gajarsky/feature/expand_box_ratio
Feature/expand box ratio
2 parents: be88115 + 093c1e4

12 files changed (+669 additions, -611 deletions)


CHANGELOG.md

Lines changed: 11 additions & 0 deletions

@@ -1,5 +1,16 @@
 # Change Log
 
+
+## 0.1.2
+
+Released on November 10, 2022.
+
+### Added
+* links to Demo App and User Guide in README.md
+
+### Changed
+* Box expansion method changed from static absolute value to dynamic relative value
+
 ## 0.1.1
 
 Released on August 31, 2022.
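In practice, the "Changed" entry above means detected face boxes are no longer padded by a fixed pixel count (expand_pixels: 4) but by a fraction of their own size (expand_box_ratio: 0.15), so small and large faces receive proportionally similar margins. The sketch below is a minimal standalone illustration, not facetorch code: the function names and example box are made up here, and the ratio math mirrors the Location.expand change shown in the docs/facetorch/datastruct.html diff further down.

def expand_by_pixels(x1, y1, x2, y2, amount=4):
    # old behaviour: every side moves out by a fixed pixel amount
    return x1 - amount, y1 - amount, x2 + amount, y2 + amount

def expand_by_ratio(x1, y1, x2, y2, amount=0.15):
    # new behaviour: each side moves out by half of (side length * ratio);
    # x2/y2 reuse the already-shifted x1/y1, exactly as in the diffed code
    x1 = x1 - int((x2 - x1) / 2 * amount)
    y1 = y1 - int((y2 - y1) / 2 * amount)
    x2 = x2 + int((x2 - x1) / 2 * amount)
    y2 = y2 + int((y2 - y1) / 2 * amount)
    return x1, y1, x2, y2

print(expand_by_pixels(10, 10, 110, 60))  # (6, 6, 114, 64)
print(expand_by_ratio(10, 10, 110, 60))   # (3, 7, 118, 63)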

README.md

Lines changed: 4 additions & 1 deletion

@@ -6,8 +6,11 @@
 [![PyPI - License](https://img.shields.io/pypi/l/facetorch)](https://raw.githubusercontent.com/tomas-gajarsky/facetorch/main/LICENSE)
 <a href="https://github.com/psf/black"><img alt="Code style: black" src="https://img.shields.io/badge/code%20style-black-000000.svg"></a>
 
+[Demo App on Hugging Face Spaces 🤗 ](https://huggingface.co/spaces/tomas-gajarsky/facetorch-app)
 
-[Documentation](https://tomas-gajarsky.github.io/facetorch/facetorch/index.html), [Docker Hub](https://hub.docker.com/repository/docker/tomasgajarsky/facetorch) [(GPU)](https://hub.docker.com/repository/docker/tomasgajarsky/facetorch-gpu)
+[User Guide](https://medium.com/@gajarsky.tomas/facetorch-user-guide-a0e9fd2a5552), [Documentation](https://tomas-gajarsky.github.io/facetorch/facetorch/index.html)
+
+[Docker Hub](https://hub.docker.com/repository/docker/tomasgajarsky/facetorch) [(GPU)](https://hub.docker.com/repository/docker/tomasgajarsky/facetorch-gpu)
 
 Facetorch is a Python library that can detect faces and analyze facial features using deep neural networks. The goal is to gather open sourced face analysis models from the community, optimize them for performance using TorchScript and combine them to create a face analysis tool that one can:
 

conf/analyzer/detector/retinaface.yaml

Lines changed: 1 addition & 1 deletion

@@ -45,4 +45,4 @@ postprocessor:
 clip: False
 variance: [0.1, 0.2]
 reverse_colors: ${analyzer.detector.reverse_colors} # True # bool
-expand_pixels: 4 # int
+expand_box_ratio: 0.15 # float
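Since the detector settings are OmegaConf-style YAML (note the ${...} interpolation above), the new value can be inspected or overridden before the analyzer is built. A minimal sketch, assuming a local checkout of the repository and that postprocessor is a top-level key in this file, as the hunk header suggests:

from omegaconf import OmegaConf

# Hypothetical usage: load the detector config and adjust the new knob.
cfg = OmegaConf.load("conf/analyzer/detector/retinaface.yaml")
print(cfg.postprocessor.expand_box_ratio)   # 0.15, the new default
cfg.postprocessor.expand_box_ratio = 0.3    # e.g. a looser crop around each face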

docs/facetorch/analyzer/detector/index.html

Lines changed: 0 additions & 2 deletions

@@ -1,7 +1,6 @@
 <!doctype html>
 <html lang="en">
 <head>
-<meta name="google-site-verification" content="YIhgkma200wIq_XsAUQ9zFq2isMAdB5CUSrzqys38y4" />
 <meta charset="utf-8">
 <meta name="viewport" content="width=device-width, initial-scale=1, minimum-scale=1" />
 <meta name="generator" content="pdoc 0.10.0" />

@@ -252,7 +251,6 @@ <h4><code><a title="facetorch.analyzer.detector.FaceDetector" href="#facetorch.a
 </nav>
 </main>
 <footer id="footer">
-<p><a href="https://github.com/tomas-gajarsky/facetorch" title="facetorch: detect faces and analyze facial features using neural networks"><cite>facetorch GitHub repository</cite></a></p>
 <p>Generated by <a href="https://pdoc3.github.io/pdoc" title="pdoc: Python API documentation generator"><cite>pdoc</cite> 0.10.0</a>.</p>
 </footer>
 </body>

docs/facetorch/analyzer/detector/post.html

Lines changed: 11 additions & 11 deletions

@@ -145,7 +145,7 @@ <h1 class="title">Module <code>facetorch.analyzer.detector.post</code></h1>
 prior_box: PriorBox,
 variance: List[float],
 reverse_colors: bool = False,
-expand_pixels: int = 0,
+expand_box_ratio: float = 0.0,
 ):
 &#34;&#34;&#34;Initialize the detector postprocessor. Modified from https://github.com/biubug6/Pytorch_Retinaface.
 

@@ -161,7 +161,7 @@ <h1 class="title">Module <code>facetorch.analyzer.detector.post</code></h1>
 prior_box (PriorBox): PriorBox object.
 variance (List[float]): Prior box variance.
 reverse_colors (bool): Whether to reverse the colors of the image tensor from RGB to BGR or vice versa. If False, the colors remain unchanged. Default: False.
-expand_pixels (int): Number of pixels to expand the face location and tensor by. Default: 0.
+expand_box_ratio (float): Expand the box by this ratio. Default: 0.0.
 &#34;&#34;&#34;
 super().__init__(transform, device, optimize_transform)
 self.confidence_threshold = confidence_threshold

@@ -172,7 +172,7 @@ <h1 class="title">Module <code>facetorch.analyzer.detector.post</code></h1>
 self.prior_box = prior_box
 self.variance = list(variance)
 self.reverse_colors = reverse_colors
-self.expand_pixels = expand_pixels
+self.expand_box_ratio = expand_box_ratio
 
 @Timer(&#34;PostRetFace.run&#34;, &#34;{name}: {milliseconds:.2f} ms&#34;, logger.debug)
 def run(

@@ -313,7 +313,7 @@ <h1 class="title">Module <code>facetorch.analyzer.detector.post</code></h1>
 y2=int(_det[3]),
 )
 
-loc.expand(amount=self.expand_pixels)
+loc.expand(amount=self.expand_box_ratio)
 loc.form_square()
 
 return loc

@@ -587,7 +587,7 @@ <h2 id="returns">Returns</h2>
 </dd>
 <dt id="facetorch.analyzer.detector.post.PostRetFace"><code class="flex name class">
 <span>class <span class="ident">PostRetFace</span></span>
-<span>(</span><span>transform: torchvision.transforms.transforms.Compose, device: torch.device, optimize_transform: bool, confidence_threshold: float, top_k: int, nms_threshold: float, keep_top_k: int, score_threshold: float, prior_box: <a title="facetorch.analyzer.detector.post.PriorBox" href="#facetorch.analyzer.detector.post.PriorBox">PriorBox</a>, variance: List[float], reverse_colors: bool = False, expand_pixels: int = 0)</span>
+<span>(</span><span>transform: torchvision.transforms.transforms.Compose, device: torch.device, optimize_transform: bool, confidence_threshold: float, top_k: int, nms_threshold: float, keep_top_k: int, score_threshold: float, prior_box: <a title="facetorch.analyzer.detector.post.PriorBox" href="#facetorch.analyzer.detector.post.PriorBox">PriorBox</a>, variance: List[float], reverse_colors: bool = False, expand_box_ratio: float = 0.0)</span>
 </code></dt>
 <dd>
 <div class="desc"><p>Initialize the detector postprocessor. Modified from <a href="https://github.com/biubug6/Pytorch_Retinaface.">https://github.com/biubug6/Pytorch_Retinaface.</a></p>

@@ -615,8 +615,8 @@ <h2 id="args">Args</h2>
 <dd>Prior box variance.</dd>
 <dt><strong><code>reverse_colors</code></strong> :&ensp;<code>bool</code></dt>
 <dd>Whether to reverse the colors of the image tensor from RGB to BGR or vice versa. If False, the colors remain unchanged. Default: False.</dd>
-<dt><strong><code>expand_pixels</code></strong> :&ensp;<code>int</code></dt>
-<dd>Number of pixels to expand the face location and tensor by. Default: 0.</dd>
+<dt><strong><code>expand_box_ratio</code></strong> :&ensp;<code>float</code></dt>
+<dd>Expand the box by this ratio. Default: 0.0.</dd>
 </dl></div>
 <details class="source">
 <summary>

@@ -637,7 +637,7 @@ <h2 id="args">Args</h2>
 prior_box: PriorBox,
 variance: List[float],
 reverse_colors: bool = False,
-expand_pixels: int = 0,
+expand_box_ratio: float = 0.0,
 ):
 &#34;&#34;&#34;Initialize the detector postprocessor. Modified from https://github.com/biubug6/Pytorch_Retinaface.
 

@@ -653,7 +653,7 @@ <h2 id="args">Args</h2>
 prior_box (PriorBox): PriorBox object.
 variance (List[float]): Prior box variance.
 reverse_colors (bool): Whether to reverse the colors of the image tensor from RGB to BGR or vice versa. If False, the colors remain unchanged. Default: False.
-expand_pixels (int): Number of pixels to expand the face location and tensor by. Default: 0.
+expand_box_ratio (float): Expand the box by this ratio. Default: 0.0.
 &#34;&#34;&#34;
 super().__init__(transform, device, optimize_transform)
 self.confidence_threshold = confidence_threshold

@@ -664,7 +664,7 @@ <h2 id="args">Args</h2>
 self.prior_box = prior_box
 self.variance = list(variance)
 self.reverse_colors = reverse_colors
-self.expand_pixels = expand_pixels
+self.expand_box_ratio = expand_box_ratio
 
 @Timer(&#34;PostRetFace.run&#34;, &#34;{name}: {milliseconds:.2f} ms&#34;, logger.debug)
 def run(

@@ -805,7 +805,7 @@ <h2 id="args">Args</h2>
 y2=int(_det[3]),
 )
 
-loc.expand(amount=self.expand_pixels)
+loc.expand(amount=self.expand_box_ratio)
 loc.form_square()
 
 return loc

docs/facetorch/datastruct.html

Lines changed: 54 additions & 40 deletions

@@ -86,20 +86,27 @@ <h1 class="title">Module <code>facetorch.datastruct</code></h1>
 else:
 pass
 
-def expand(self, amount: int) -&gt; None:
+def expand(self, amount: float) -&gt; None:
 &#34;&#34;&#34;Expand the location while keeping the center.
 
 Args:
-amount (int): Amount of pixels to expand the location by.
+amount (float): Amount to expand the location by in multiples of the original size.
+
 
 Returns:
 None
 &#34;&#34;&#34;
-if amount != 0:
-self.x1 = self.x1 - amount
-self.y1 = self.y1 - amount
-self.x2 = self.x2 + amount
-self.y2 = self.y2 + amount
+assert amount &gt;= 0, &#34;Amount must be greater than or equal to 0.&#34;
+# if amount != 0:
+# self.x1 = self.x1 - amount
+# self.y1 = self.y1 - amount
+# self.x2 = self.x2 + amount
+# self.y2 = self.y2 + amount
+if amount != 0.0:
+self.x1 = self.x1 - int((self.x2 - self.x1) / 2 * amount)
+self.y1 = self.y1 - int((self.y2 - self.y1) / 2 * amount)
+self.x2 = self.x2 + int((self.x2 - self.x1) / 2 * amount)
+self.y2 = self.y2 + int((self.y2 - self.y1) / 2 * amount)
 
 
 @dataclass

@@ -302,8 +309,7 @@ <h2 id="attributes">Attributes</h2>
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">@dataclass
-class Dimensions:
+<pre><code class="python">class Dimensions:
 &#34;&#34;&#34;Data class for image dimensions.
 
 Attributes:

@@ -347,8 +353,7 @@ <h2 id="attributes">Attributes</h2>
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">@dataclass
-class Location:
+<pre><code class="python">class Location:
 &#34;&#34;&#34;Data class for face location.
 
 Attributes:

@@ -383,20 +388,27 @@ <h2 id="attributes">Attributes</h2>
 else:
 pass
 
-def expand(self, amount: int) -&gt; None:
+def expand(self, amount: float) -&gt; None:
 &#34;&#34;&#34;Expand the location while keeping the center.
 
 Args:
-amount (int): Amount of pixels to expand the location by.
+amount (float): Amount to expand the location by in multiples of the original size.
+
 
 Returns:
 None
 &#34;&#34;&#34;
-if amount != 0:
-self.x1 = self.x1 - amount
-self.y1 = self.y1 - amount
-self.x2 = self.x2 + amount
-self.y2 = self.y2 + amount</code></pre>
+assert amount &gt;= 0, &#34;Amount must be greater than or equal to 0.&#34;
+# if amount != 0:
+# self.x1 = self.x1 - amount
+# self.y1 = self.y1 - amount
+# self.x2 = self.x2 + amount
+# self.y2 = self.y2 + amount
+if amount != 0.0:
+self.x1 = self.x1 - int((self.x2 - self.x1) / 2 * amount)
+self.y1 = self.y1 - int((self.y2 - self.y1) / 2 * amount)
+self.x2 = self.x2 + int((self.x2 - self.x1) / 2 * amount)
+self.y2 = self.y2 + int((self.y2 - self.y1) / 2 * amount)</code></pre>
 </details>
 <h3>Class variables</h3>
 <dl>

@@ -452,42 +464,49 @@ <h2 id="returns">Returns</h2>
 </details>
 </dd>
 <dt id="facetorch.datastruct.Location.expand"><code class="name flex">
-<span>def <span class="ident">expand</span></span>(<span>self, amount: int) ‑> None</span>
+<span>def <span class="ident">expand</span></span>(<span>self, amount: float) ‑> None</span>
 </code></dt>
 <dd>
 <div class="desc"><p>Expand the location while keeping the center.</p>
 <h2 id="args">Args</h2>
 <dl>
-<dt><strong><code>amount</code></strong> :&ensp;<code>int</code></dt>
-<dd>Amount of pixels to expand the location by.</dd>
+<dt><strong><code>amount</code></strong> :&ensp;<code>float</code></dt>
+<dd>Amount to expand the location by in multiples of the original size.</dd>
 </dl>
 <h2 id="returns">Returns</h2>
 <p>None</p></div>
 <details class="source">
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">def expand(self, amount: int) -&gt; None:
+<pre><code class="python">def expand(self, amount: float) -&gt; None:
 &#34;&#34;&#34;Expand the location while keeping the center.
 
 Args:
-amount (int): Amount of pixels to expand the location by.
+amount (float): Amount to expand the location by in multiples of the original size.
+
 
 Returns:
 None
 &#34;&#34;&#34;
-if amount != 0:
-self.x1 = self.x1 - amount
-self.y1 = self.y1 - amount
-self.x2 = self.x2 + amount
-self.y2 = self.y2 + amount</code></pre>
+assert amount &gt;= 0, &#34;Amount must be greater than or equal to 0.&#34;
+# if amount != 0:
+# self.x1 = self.x1 - amount
+# self.y1 = self.y1 - amount
+# self.x2 = self.x2 + amount
+# self.y2 = self.y2 + amount
+if amount != 0.0:
+self.x1 = self.x1 - int((self.x2 - self.x1) / 2 * amount)
+self.y1 = self.y1 - int((self.y2 - self.y1) / 2 * amount)
+self.x2 = self.x2 + int((self.x2 - self.x1) / 2 * amount)
+self.y2 = self.y2 + int((self.y2 - self.y1) / 2 * amount)</code></pre>
 </details>
 </dd>
 </dl>
 </dd>
 <dt id="facetorch.datastruct.Prediction"><code class="flex name class">
 <span>class <span class="ident">Prediction</span></span>
-<span>(</span><span>label: str = &lt;factory&gt;, logits: torch.Tensor = &lt;factory&gt;, other: Dict = &lt;factory&gt;)</span>
+<span>(</span><span>label: str = &lt;factory&gt;, logits: torch.Tensor = &lt;factory&gt;, other: Dict[~KT, ~VT] = &lt;factory&gt;)</span>
 </code></dt>
 <dd>
 <div class="desc"><p>Data class for face prediction results and derivatives.</p>

@@ -504,8 +523,7 @@ <h2 id="attributes">Attributes</h2>
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">@dataclass
-class Prediction:
+<pre><code class="python">class Prediction:
 &#34;&#34;&#34;Data class for face prediction results and derivatives.
 
 Attributes:

@@ -528,7 +546,7 @@ <h3>Class variables</h3>
 <dd>
 <div class="desc"></div>
 </dd>
-<dt id="facetorch.datastruct.Prediction.other"><code class="name">var <span class="ident">other</span> : Dict</code></dt>
+<dt id="facetorch.datastruct.Prediction.other"><code class="name">var <span class="ident">other</span> : Dict[~KT, ~VT]</code></dt>
 <dd>
 <div class="desc"></div>
 </dd>

@@ -557,8 +575,7 @@ <h2 id="attributes">Attributes</h2>
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">@dataclass
-class Detection:
+<pre><code class="python">class Detection:
 &#34;&#34;&#34;Data class for detector output.
 
 Attributes:

@@ -625,8 +642,7 @@ <h2 id="attributes">Attributes</h2>
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">@dataclass
-class Face:
+<pre><code class="python">class Face:
 &#34;&#34;&#34;Data class for face attributes.
 
 Attributes:

@@ -702,8 +718,7 @@ <h2 id="attributes">Attributes</h2>
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">@dataclass
-class ImageData:
+<pre><code class="python">class ImageData:
 &#34;&#34;&#34;The main data class used for passing data between the different facetorch modules.
 
 Attributes:

@@ -1045,8 +1060,7 @@ <h2 id="attributes">Attributes</h2>
 <summary>
 <span>Expand source code</span>
 </summary>
-<pre><code class="python">@dataclass
-class Response:
+<pre><code class="python">class Response:
 &#34;&#34;&#34;Data class for response data, which is a subset of ImageData.
 
 Attributes:

docs/facetorch/index.html

Lines changed: 2 additions & 0 deletions

@@ -1,6 +1,7 @@
 <!doctype html>
 <html lang="en">
 <head>
+<meta name="google-site-verification" content="YIhgkma200wIq_XsAUQ9zFq2isMAdB5CUSrzqys38y4" />
 <meta charset="utf-8">
 <meta name="viewport" content="width=device-width, initial-scale=1, minimum-scale=1" />
 <meta name="generator" content="pdoc 0.10.0" />

@@ -453,6 +454,7 @@ <h4><code><a title="facetorch.FaceAnalyzer" href="#facetorch.FaceAnalyzer">FaceA
 </nav>
 </main>
 <footer id="footer">
+<p><a href="https://github.com/tomas-gajarsky/facetorch" title="facetorch: detect faces and analyze facial features using neural networks"><cite>facetorch GitHub repository</cite></a></p>
 <p>Generated by <a href="https://pdoc3.github.io/pdoc" title="pdoc: Python API documentation generator"><cite>pdoc</cite> 0.10.0</a>.</p>
 </footer>
 </body>

docs/facetorch/transforms.html

Lines changed: 13 additions & 0 deletions

@@ -197,6 +197,17 @@ <h3>Ancestors</h3>
 <ul class="hlist">
 <li>torch.nn.modules.module.Module</li>
 </ul>
+<h3>Class variables</h3>
+<dl>
+<dt id="facetorch.transforms.SquarePad.dump_patches"><code class="name">var <span class="ident">dump_patches</span> : bool</code></dt>
+<dd>
+<div class="desc"></div>
+</dd>
+<dt id="facetorch.transforms.SquarePad.training"><code class="name">var <span class="ident">training</span> : bool</code></dt>
+<dd>
+<div class="desc"></div>
+</dd>
+</dl>
 <h3>Methods</h3>
 <dl>
 <dt id="facetorch.transforms.SquarePad.forward"><code class="name flex">

@@ -304,6 +315,8 @@ <h1>Index</h1>
 <h4><code><a title="facetorch.transforms.SquarePad" href="#facetorch.transforms.SquarePad">SquarePad</a></code></h4>
 <ul class="">
 <li><code><a title="facetorch.transforms.SquarePad.forward" href="#facetorch.transforms.SquarePad.forward">forward</a></code></li>
+<li><code><a title="facetorch.transforms.SquarePad.dump_patches" href="#facetorch.transforms.SquarePad.dump_patches">dump_patches</a></code></li>
+<li><code><a title="facetorch.transforms.SquarePad.training" href="#facetorch.transforms.SquarePad.training">training</a></code></li>
 </ul>
 </li>
 </ul>
