From 20dbc910ba49f2b292c7c61933b72163a818a339 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?M=C3=A9lodie=20Boillet?= <boillet@teklia.com>
Date: Thu, 3 Aug 2023 08:34:33 +0200
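Subject: [PATCH] Apply 65177a4b

Remove the `input_channels` encoder parameter. The first ConvBlock of
FCN_Encoder now always takes 3 input channels instead of reading
params["input_channels"]. The option is dropped from the default training
configuration, the documentation, and the test configuration/fixtures.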
---
 dan/encoder.py                       | 4 +---
 dan/ocr/document/train.py            | 1 -
 docs/get_started/training.md         | 1 -
 docs/usage/train/parameters.md       | 1 -
 tests/conftest.py                    | 1 -
 tests/data/prediction/parameters.yml | 1 -
 6 files changed, 1 insertion(+), 8 deletions(-)

diff --git a/dan/encoder.py b/dan/encoder.py
index 6057cadd..0e38f633 100644
--- a/dan/encoder.py
+++ b/dan/encoder.py
@@ -92,9 +92,7 @@ class FCN_Encoder(Module):
 
         self.init_blocks = ModuleList(
             [
-                ConvBlock(
-                    params["input_channels"], 16, stride=(1, 1), dropout=self.dropout
-                ),
+                ConvBlock(3, 16, stride=(1, 1), dropout=self.dropout),
                 ConvBlock(16, 32, stride=(2, 2), dropout=self.dropout),
                 ConvBlock(32, 64, stride=(2, 2), dropout=self.dropout),
                 ConvBlock(64, 128, stride=(2, 2), dropout=self.dropout),
diff --git a/dan/ocr/document/train.py b/dan/ocr/document/train.py
index ad4643b9..97cae761 100644
--- a/dan/ocr/document/train.py
+++ b/dan/ocr/document/train.py
@@ -138,7 +138,6 @@ def get_config():
             },
             "transfered_charset": True,  # Transfer learning of the decision layer based on charset of the line HTR model
             "additional_tokens": 1,  # for decision layer = [<eot>, ], only for transferred charset
-            "input_channels": 3,  # number of channels of input image
             "dropout": 0.5,  # dropout rate for encoder
             "enc_dim": 256,  # dimension of extracted features
             "nb_layers": 5,  # encoder
diff --git a/docs/get_started/training.md b/docs/get_started/training.md
index 598eba39..71cdd974 100644
--- a/docs/get_started/training.md
+++ b/docs/get_started/training.md
@@ -53,7 +53,6 @@ parameters:
   std: [float, float, float]
   max_char_prediction: int
   encoder:
-    input_channels: int
     dropout: float
   decoder:
     enc_dim: int
diff --git a/docs/usage/train/parameters.md b/docs/usage/train/parameters.md
index d659a1e0..5dd48610 100644
--- a/docs/usage/train/parameters.md
+++ b/docs/usage/train/parameters.md
@@ -132,7 +132,6 @@ For a detailed description of all augmentation transforms, see the [dedicated pa
 | `model_params.transfer_learning.decoder`  | Model to load for the decoder [state_dict_name, checkpoint_path, learnable, strict]. | `list`       | `["encoder", "pretrained_models/dan_rimes_page.pt", True, False]` |
 | `model_params.transfered_charset`         | Transfer learning of the decision layer based on charset of the model to transfer.   | `bool`       | `True`                                                            |
 | `model_params.additional_tokens`          | For decision layer = [<eot>, ], only for transferred charset.                        | `int`        | `1`                                                               |
-| `model_params.input_channels`             | Number of channels of input image.                                                   | `int`        | `3`                                                               |
 | `model_params.dropout`                    | Dropout probability in the encoder.                                                  | `float`      | `0.5`                                                             |
 | `model_params.enc_dim`                    | Dimension of features extracted by the encoder.                                      | `int`        | `256`                                                             |
 | `model_params.nb_layers`                  | Number of layers in the encoder.                                                     | `int`        | `5`                                                               |
diff --git a/tests/conftest.py b/tests/conftest.py
index e804cb36..4a365be7 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -86,7 +86,6 @@ def training_config():
             "transfer_learning": None,
             "transfered_charset": True,  # Transfer learning of the decision layer based on charset of the line HTR model
             "additional_tokens": 1,  # for decision layer = [<eot>, ], only for transferred charset
-            "input_channels": 3,  # number of channels of input image
             "dropout": 0.5,  # dropout rate for encoder
             "enc_dim": 256,  # dimension of extracted features
             "nb_layers": 5,  # encoder
diff --git a/tests/data/prediction/parameters.yml b/tests/data/prediction/parameters.yml
index c299406c..f07baaec 100644
--- a/tests/data/prediction/parameters.yml
+++ b/tests/data/prediction/parameters.yml
@@ -5,7 +5,6 @@ parameters:
   std: [34.084189571536385, 34.084189571536385, 34.084189571536385]
   max_char_prediction: 200
   encoder:
-    input_channels: 3
     dropout: 0.5
   decoder:
     enc_dim: 256
-- 
GitLab