From 6bfb517c1668aad49d4f0090daa5dca2f7cb0ecc Mon Sep 17 00:00:00 2001
From: AdoptMeTradingValues
 <108958603+AdoptMeTradingValues@users.noreply.github.com>
Date: Mon, 29 Jan 2024 21:43:12 -0500
Subject: [PATCH 1/4] Delete train.py

---
 train.py | 210 -------------------------------------------------------
 1 file changed, 210 deletions(-)
 delete mode 100644 train.py

diff --git a/train.py b/train.py
deleted file mode 100644
index 7605b2f..0000000
--- a/train.py
+++ /dev/null
@@ -1,210 +0,0 @@
-import argparse
-import os
-
-import torch
-
-import handwriting_synthesis.callbacks
-import handwriting_synthesis.tasks
-from handwriting_synthesis import training
-from handwriting_synthesis import data, utils, models, metrics
-from handwriting_synthesis.sampling import UnconditionalSampler, HandwritingSynthesizer
-
-
-class ConfigOptions:
-    def __init__(self, batch_size, epochs, sampling_interval,
-                 num_train_examples, num_val_examples, max_length,
-                 model_path, charset_path, samples_dir,
-                 output_clip_value, lstm_clip_value):
-        self.batch_size = batch_size
-        self.epochs = epochs
-        self.sampling_interval = sampling_interval
-        self.num_train_examples = num_train_examples
-        self.num_val_examples = num_val_examples
-        self.max_length = max_length
-        self.model_path = model_path
-        self.charset_path = charset_path
-        self.samples_dir = samples_dir
-        self.output_clip_value = output_clip_value
-        self.lstm_clip_value = lstm_clip_value
-
-
-def print_info_message(training_task_verbose, config):
-    print(f'{training_task_verbose} with options: training set size {config.num_train_examples}, '
-          f'validation set size {config.num_val_examples}, '
-          f'batch size {config.batch_size}, '
-          f'max sequence length {config.max_length},'
-          f'sampling interval (in # iterations): {config.sampling_interval}')
-
-
-def train_model(train_set, val_set, train_task, callbacks, config, training_task_verbose, sampler):
-    print_info_message(training_task_verbose, config)
-
-    train_metrics = [metrics.MSE(), metrics.SSE()]
-    val_metrics = [metrics.MSE(), metrics.SSE()]
-
-    loop = training.TrainingLoop(train_set, val_set, batch_size=config.batch_size, training_task=train_task,
-                                 train_metrics=train_metrics, val_metrics=val_metrics)
-
-    for cb in callbacks:
-        loop.add_callback(cb)
-
-    sample_class = sampler.__class__
-    _, largest_epoch = sample_class.load_latest(check_points_dir=config.model_path,
-                                                device=torch.device("cpu"))
-
-    saver = handwriting_synthesis.callbacks.EpochModelCheckpoint(
-        sampler, config.model_path, save_interval=1
-    )
-    loop.add_callback(saver)
-
-    loop.start(initial_epoch=largest_epoch, epochs=config.epochs)
-
-
-def train_unconditional_handwriting_generator(train_set, val_set, device, config):
-    sampler, epochs = UnconditionalSampler.load_latest(config.model_path, device)
-    if sampler:
-        model = sampler.model
-    else:
-        model = models.HandwritingPredictionNetwork.get_default_model(device)
-        model = model.to(device)
-
-    if not sampler:
-        mu = torch.tensor(train_set.mu, dtype=torch.float32)
-        sd = torch.tensor(train_set.std, dtype=torch.float32)
-        tokenizer = data.Tokenizer.from_file(config.charset_path)
-        sampler = UnconditionalSampler(model, mu, sd, tokenizer.charset, num_steps=config.max_length)
-
-    if config.output_clip_value == 0 or config.lstm_clip_value == 0:
-        clip_values = None
-    else:
-        clip_values = (config.output_clip_value, config.lstm_clip_value)
-
-    train_task = handwriting_synthesis.tasks.HandwritingPredictionTrainingTask(device, model, clip_values)
-
-    cb = handwriting_synthesis.callbacks.HandwritingGenerationCallback(
-        model, config.samples_dir, config.max_length,
-        val_set, iteration_interval=config.sampling_interval
-    )
-
-    train_model(train_set, val_set, train_task, [cb], config,
-                training_task_verbose='Training (unconditional) handwriting prediction model', sampler=sampler)
-
-
-def train_handwriting_synthesis_model(train_set, val_set, device, config):
-    synthesizer, epochs = HandwritingSynthesizer.load_latest(config.model_path, device)
-
-    if synthesizer:
-        model = synthesizer.model
-    else:
-        tokenizer = data.Tokenizer.from_file(config.charset_path)
-        alphabet_size = tokenizer.size
-
-        model = models.SynthesisNetwork.get_default_model(alphabet_size, device)
-        model = model.to(device)
-
-        mu = torch.tensor(train_set.mu, dtype=torch.float32)
-        sd = torch.tensor(train_set.std, dtype=torch.float32)
-        synthesizer = HandwritingSynthesizer(
-            model, mu, sd, tokenizer.charset, num_steps=config.max_length
-        )
-
-    if config.output_clip_value == 0 or config.lstm_clip_value == 0:
-        clip_values = None
-    else:
-        clip_values = (config.output_clip_value, config.lstm_clip_value)
-
-    train_task = handwriting_synthesis.tasks.HandwritingSynthesisTask(
-        synthesizer.tokenizer, device, model, clip_values
-    )
-
-    cb = handwriting_synthesis.callbacks.HandwritingSynthesisCallback(
-        synthesizer.tokenizer,
-        10,
-        model, config.samples_dir, config.max_length,
-        val_set, iteration_interval=config.sampling_interval
-    )
-
-    train_model(train_set, val_set, train_task, [cb], config,
-                training_task_verbose='Training handwriting synthesis model', sampler=synthesizer)
-
-
-def get_device():
-    dev = torch.device("cpu")
-    if torch.cuda.is_available():
-        dev = torch.device("cuda:0")
-    else:
-        try:
-            import torch_xla
-            import torch_xla.core.xla_model as xm
-            # computations on TPU are very slow for some reason
-            dev = xm.xla_device()
-        except ImportError:
-            pass
-    return dev
-
-
-if __name__ == '__main__':
-    parser = argparse.ArgumentParser(
-        description='Starts/resumes training prediction or synthesis network.'
-    )
-
-    parser.add_argument("data_dir", type=str, help="Directory containing training and validation data h5 files")
-    parser.add_argument("model_dir", type=str, help="Directory storing model weights")
-    parser.add_argument(
-        "-u", "--unconditional", default=False, action="store_true",
-        help="Whether or not to train synthesis network (synthesis network is trained by default)"
-    )
-    parser.add_argument("-b", "--batch_size", type=int, default=32, help="Batch size")
-    parser.add_argument("-e", "--epochs", type=int, default=100, help="# of epochs to train")
-    parser.add_argument("-i", "--interval", type=int, default=100, help="Iterations between sampling")
-    parser.add_argument("-c", "--charset", type=str, default='', help="Path to the charset file")
-
-    parser.add_argument("--samples_dir", type=str, default='samples',
-                        help="Path to the directory that will store samples")
-
-    parser.add_argument(
-        "--clip1", type=int, default=0,
-        help="Gradient clipping value for output layer. "
-             "When omitted or set to zero, no clipping is done."
-    )
-    parser.add_argument(
-        "--clip2", type=int, default=0,
-        help="Gradient clipping value for lstm layers. "
-             "When omitted or set to zero, no clipping is done."
-    )
-
-    args = parser.parse_args()
-
-    device = get_device()
-
-    print(f'Using device {device}')
-
-    with data.H5Dataset(f'{args.data_dir}/train.h5') as dataset:
-        mu = dataset.mu
-        sd = dataset.std
-
-    train_dataset_path = os.path.join(args.data_dir, 'train.h5')
-    val_dataset_path = os.path.join(args.data_dir, 'val.h5')
-
-    default_charset_path = os.path.join(args.data_dir, 'charset.txt')
-    charset_path = utils.get_charset_path_or_raise(args.charset, default_charset_path)
-
-    with data.NormalizedDataset(train_dataset_path, mu, sd) as train_set, \
-            data.NormalizedDataset(val_dataset_path, mu, sd) as val_set:
-        num_train_examples = len(train_set)
-        num_val_examples = len(val_set)
-        max_length = train_set.max_length
-        model_path = args.model_dir
-
-        config = ConfigOptions(batch_size=args.batch_size, epochs=args.epochs,
-                               sampling_interval=args.interval, num_train_examples=num_train_examples,
-                               num_val_examples=num_val_examples, max_length=max_length,
-                               model_path=model_path,
-                               charset_path=charset_path,
-                               samples_dir=args.samples_dir,
-                               output_clip_value=args.clip1, lstm_clip_value=args.clip2)
-
-        if args.unconditional:
-            train_unconditional_handwriting_generator(train_set, val_set, device, config)
-        else:
-            train_handwriting_synthesis_model(train_set, val_set, device, config)

From eb010d381133ad53ad96865247afd5fb4f99b423 Mon Sep 17 00:00:00 2001
From: AdoptMeTradingValues
 <108958603+AdoptMeTradingValues@users.noreply.github.com>
Date: Mon, 29 Jan 2024 21:43:42 -0500
Subject: [PATCH 2/4] Delete txt2script.py

---
 txt2script.py | 44 --------------------------------------------
 1 file changed, 44 deletions(-)
 delete mode 100644 txt2script.py

diff --git a/txt2script.py b/txt2script.py
deleted file mode 100644
index a8291ce..0000000
--- a/txt2script.py
+++ /dev/null
@@ -1,44 +0,0 @@
-import re
-import os
-import argparse
-import torch
-
-from handwriting_synthesis import utils
-from handwriting_synthesis.sampling import HandwritingSynthesizer
-
-
-if __name__ == '__main__':
-    parser = argparse.ArgumentParser(description='Converts a text file into a handwriting page.')
-    parser.add_argument("model_path", type=str, help="Path to saved model")
-    parser.add_argument(
-        "input_path", type=str, help="A path to a text file that needs to be converted to a handwriting")
-    parser.add_argument(
-        "-b", "--bias",  type=float, default=0, help="A probability bias. Unbiased sampling is performed by default."
-    )
-
-    parser.add_argument("--output_path", type=str, default='',
-                        help="Path to the generated handwriting file "
-                             "(by default, it will be saved to the current working directory "
-                             "whose name will be input_path with trailing .png extension)")
-
-    parser.add_argument(
-        "--thickness", type=int, default=10,
-        help="Handwriting thickness in pixels. It is set to 10 by default."
-    )
-
-    args = parser.parse_args()
-
-    if not os.path.isfile(args.input_path):
-        raise Exception(f'Text file not found: {args.input_path}')
-
-    base_file_name = re.sub('[^0-9a-zA-Z]+', '_', args.input_path)
-    output_path = args.output_path or f'{base_file_name}_.png'
-    thickness = args.thickness
-
-    device = torch.device("cpu")
-    synthesizer = HandwritingSynthesizer.load(args.model_path, device, args.bias)
-
-    with open(args.input_path) as f:
-        text = f.read()
-
-    utils.text_to_script(synthesizer, text, output_path, thickness=thickness)

From 68ae9cc7401dedfaf26b7bf1e523b2a86c293ad0 Mon Sep 17 00:00:00 2001
From: AdoptMeTradingValues
 <108958603+AdoptMeTradingValues@users.noreply.github.com>
Date: Mon, 29 Jan 2024 21:44:35 -0500
Subject: [PATCH 3/4] Create txt-to-script-pdf.py

---
 txt-to-script-pdf.py | 70 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 70 insertions(+)
 create mode 100644 txt-to-script-pdf.py

diff --git a/txt-to-script-pdf.py b/txt-to-script-pdf.py
new file mode 100644
index 0000000..edc109c
--- /dev/null
+++ b/txt-to-script-pdf.py
@@ -0,0 +1,70 @@
+import re
+import os
+import argparse
+import torch
+
+from handwriting_synthesis import utils
+from handwriting_synthesis.sampling import HandwritingSynthesizer
+# NOTE(review): canvas is not used anywhere in this script.
+from reportlab.pdfgen import canvas
+
+
+def save_as_pdf(image_path, pdf_path):
+    """Save the image stored at image_path as a PDF file at pdf_path."""
+    from PIL import Image
+
+    # The context manager closes the image file once the PDF is written.
+    with Image.open(image_path) as img:
+        img.save(pdf_path, "PDF", resolution=100.0)
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser(description='Converts a text file into a handwriting page.')
+    parser.add_argument("model_path", type=str, help="Path to saved model")
+    parser.add_argument(
+        "input_path", type=str, help="A path to a text file that needs to be converted to a handwriting")
+    parser.add_argument(
+        "-b", "--bias",  type=float, default=0, help="A probability bias. Unbiased sampling is performed by default."
+    )
+
+    parser.add_argument("--output_path", type=str, default='',
+                        help="Path to the generated handwriting file "
+                             "(by default, it will be saved to the current working directory "
+                             "whose name will be input_path with trailing .png extension). "
+                             "A PDF copy is saved next to it with the .pdf extension; "
+                             "when this path ends with .pdf, the image is saved next to it "
+                             "with the .png extension instead.")
+
+    parser.add_argument(
+        "--thickness", type=int, default=10,
+        help="Handwriting thickness in pixels. It is set to 10 by default."
+    )
+
+    args = parser.parse_args()
+
+    if not os.path.isfile(args.input_path):
+        raise Exception(f'Text file not found: {args.input_path}')
+
+    base_file_name = re.sub('[^0-9a-zA-Z]+', '_', args.input_path)
+    output_path = args.output_path or f'{base_file_name}_.png'
+    thickness = args.thickness
+
+    # Keep the image and the PDF in two distinct files: the PDF is produced
+    # from the rendered image, so both must never share the same path.
+    root, ext = os.path.splitext(output_path)
+    if ext.lower() == '.pdf':
+        image_path, pdf_path = f'{root}.png', output_path
+    else:
+        image_path, pdf_path = output_path, f'{root}.pdf'
+
+    device = torch.device("cpu")
+    synthesizer = HandwritingSynthesizer.load(args.model_path, device, args.bias)
+
+    with open(args.input_path) as f:
+        text = f.read()
+
+    utils.text_to_script(synthesizer, text, image_path, thickness=thickness)
+
+    # Assumes text_to_script wrote the rendered page to image_path - TODO confirm.
+    save_as_pdf(image_path, pdf_path)

From 33fc4b9d234846d4fdee2dbbf7dafd42ab2b96ed Mon Sep 17 00:00:00 2001
From: AdoptMeTradingValues
 <108958603+AdoptMeTradingValues@users.noreply.github.com>
Date: Mon, 29 Jan 2024 21:47:06 -0500
Subject: [PATCH 4/4] Update requirements.txt

---
 requirements.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/requirements.txt b/requirements.txt
index eb1d35e..c238749 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,3 +1,4 @@
+reportlab < 9
 Pillow < 10
 numpy < 2
 torch < 2