From b8410d15e9094dc2b93fde662f079e183ac01218 Mon Sep 17 00:00:00 2001
From: Amaras <amaras@vivaldi.net>
Date: Sun, 12 Jul 2020 18:30:35 +0200
Subject: [PATCH 1/6] Re-added Huffman encoding in Coconut

---
 .../code/coconut/huffman.coco                 | 112 ++++++++++++++++++
 contents/huffman_encoding/huffman_encoding.md |   2 +
 2 files changed, 114 insertions(+)
 create mode 100644 contents/huffman_encoding/code/coconut/huffman.coco

diff --git a/contents/huffman_encoding/code/coconut/huffman.coco b/contents/huffman_encoding/code/coconut/huffman.coco
new file mode 100644
index 000000000..f93f2e915
--- /dev/null
+++ b/contents/huffman_encoding/code/coconut/huffman.coco
@@ -0,0 +1,112 @@
+# Huffman Encoding
+# Coconut
+# Submitted by Amaras
+# Inspired by Matthew Giallourakis
+
+from collections import Counter, deque
+from bisect import bisect
+
+class Tree
+
+data Empty() from Tree
+data Leaf(char, n is int) from Tree:
+    def __str__(self):
+        return f'Leaf({self.char}, {self.n})'
+
+    __repr__ = __str__
+
+data Node(left is Tree, right is Tree) from Tree:
+    def __str__(self):
+        return f'Node({str(self.left)}, {str(self.right)})'
+    __repr__ = __str__
+
+def weight(Tree()) = 0
+addpattern def weight(Leaf(char, n)) = n
+addpattern def weight(Node(left, right)) = weight(left) + weight(right)
+
+# constructs the tree
+def build_huffman_tree(message):
+
+    # get sorted list of character and frequency pairs
+    frequencies = Counter(message)
+    trees = frequencies.most_common() |> map$(t -> Leaf(*t)) |> reversed |> deque
+
+    # while there is more than one tree
+    while len(trees) > 1:
+        print(trees)
+
+        # pop off the two trees of least weight from the trees list
+        tree_left = trees.popleft()
+        tree_right = trees.popleft()
+
+        # combine the nodes and add back to the nodes list
+        new_tree = Node(tree_left, tree_right)
+
+        # find the first tree that has a weight smaller than new_weight and returns its index in the list
+        # If no such tree can be found, use len(trees) instead to append
+        index = bisect(trees |> map$(weight) |> list, weight(new_tree))
+
+        # insert the new tree there
+        trees.insert(index, new_tree)
+
+    huffman_tree = trees[0]
+    return huffman_tree
+
+
+def build_codebook(Empty(), code='') = []
+addpattern def build_codebook(Leaf(char, n), code='') = [(char, code)]
+addpattern def build_codebook(Node(left, right), code='') = build_codebook(left, code+'0') + build_codebook(right, code+'1')
+
+# encodes the message
+def huffman_encode(codebook, message):
+
+    # build a char -> code dictionary
+    forward_dict = dict(codebook)
+
+    return ''.join(message |> forward_dict[])
+
+# decodes a message
+def huffman_decode(codebook, encoded_message):
+
+    decoded_message = []
+    key = ''
+
+    # build a code -> char dictionary
+    inverse_dict = dict([(v, k) for k, v in codebook])
+
+    # for each bit in the encoding
+    # if the bit is in the dictionary, replace the bit with the paired character
+    # else look at the bit and the following bits together until a match occurs
+    # move to the next bit not yet looked at
+    for index, bit in enumerate(encoded_message):
+        key += bit
+        if key in inverse_dict:
+            decoded_message.append(inverse_dict[key])
+            key = ''
+
+    return ''.join(decoded_message)
+
+
+if __name__ == '__main__':
+    # test example
+    message = 'bibbity_bobbity'
+    tree = build_huffman_tree(message)
+    codebook = build_codebook(tree)
+    encoded_message = huffman_encode(codebook, message)
+    decoded_message = huffman_decode(codebook, encoded_message)
+
+    print('message:', message)
+    print('huffman tree:', tree)
+    print('codebook:', codebook)
+    print('encoded message:', encoded_message)
+    print('decoded message:', decoded_message)
+
+    # prints the following:
+    #
+    #  message: bibbity_bobbity
+    #  huffman tree: Node(Leaf(b, 6), Node(Node(Leaf(y, 2), Leaf(t, 2)),
+    #                     Node(Node(Leaf(o, 1), Leaf(_, 1)), Leaf(i, 3))))
+    #  codebook: [('b', '0'), ('y', '100'), ('t', '101'),
+    #             ('o', '1100'), ('_', '1101'), ('i', '111')]
+    #  encoded message: 01110011110110011010110000111101100
+    #  decoded message: bibbity_bobbity
diff --git a/contents/huffman_encoding/huffman_encoding.md b/contents/huffman_encoding/huffman_encoding.md
index 885a81ab4..7a2fb4034 100644
--- a/contents/huffman_encoding/huffman_encoding.md
+++ b/contents/huffman_encoding/huffman_encoding.md
@@ -93,6 +93,8 @@ Whether you use a stack or straight-up recursion also depends on the language, b
 [import, lang:"asm-x64"](code/asm-x64/huffman.s)
 {% sample lang="scala" %}
 [import, lang:"scala"](code/scala/huffman_encoding.scala)
+{% sample lang="coco" %}
+[import, lang:"coconut"](code/coconut/huffman.coco)
 {% endmethod %}
 
 <script>

From d64bf495ced369b195cc1305ce046ee1be1b6949 Mon Sep 17 00:00:00 2001
From: Amaras <amaras@vivaldi.net>
Date: Mon, 20 Jul 2020 00:08:40 +0200
Subject: [PATCH 2/6] removed the unnecessary print

---
 contents/huffman_encoding/code/coconut/huffman.coco | 1 -
 1 file changed, 1 deletion(-)

diff --git a/contents/huffman_encoding/code/coconut/huffman.coco b/contents/huffman_encoding/code/coconut/huffman.coco
index f93f2e915..eebc1d76d 100644
--- a/contents/huffman_encoding/code/coconut/huffman.coco
+++ b/contents/huffman_encoding/code/coconut/huffman.coco
@@ -33,7 +33,6 @@ def build_huffman_tree(message):
 
     # while there is more than one tree
     while len(trees) > 1:
-        print(trees)
 
         # pop off the two trees of least weight from the trees list
         tree_left = trees.popleft()

From c4fb8c63b4ca70f30b4f82b4d67f42ce827395fd Mon Sep 17 00:00:00 2001
From: Amaras <amaras@vivaldi.net>
Date: Thu, 6 Aug 2020 13:37:40 +0200
Subject: [PATCH 3/6] Added partial patch to edge cases and improved the code

---
 .../huffman_encoding/code/coconut/huffman.coco    | 15 ++++++++++++---
 1 file changed, 12 insertions(+), 3 deletions(-)

diff --git a/contents/huffman_encoding/code/coconut/huffman.coco b/contents/huffman_encoding/code/coconut/huffman.coco
index eebc1d76d..1d4c45657 100644
--- a/contents/huffman_encoding/code/coconut/huffman.coco
+++ b/contents/huffman_encoding/code/coconut/huffman.coco
@@ -31,6 +31,9 @@ def build_huffman_tree(message):
     frequencies = Counter(message)
     trees = frequencies.most_common() |> map$(t -> Leaf(*t)) |> reversed |> deque
 
+    if not trees:
+        return Empty()
+
     # while there is more than one tree
     while len(trees) > 1:
 
@@ -62,7 +65,7 @@ def huffman_encode(codebook, message):
     # build a char -> code dictionary
     forward_dict = dict(codebook)
 
-    return ''.join(message |> forward_dict[])
+    return ''.join(message |> map$(forward_dict[]))
 
 # decodes a message
 def huffman_decode(codebook, encoded_message):
@@ -70,14 +73,20 @@ def huffman_decode(codebook, encoded_message):
     decoded_message = []
     key = ''
 
+    if not codebook:
+        return ''
+
     # build a code -> char dictionary
-    inverse_dict = dict([(v, k) for k, v in codebook])
+    inverse_dict = dict((v, k) for k, v in codebook)
 
     # for each bit in the encoding
     # if the bit is in the dictionary, replace the bit with the paired character
     # else look at the bit and the following bits together until a match occurs
     # move to the next bit not yet looked at
-    for index, bit in enumerate(encoded_message):
+    if encoded_message == '':
+        return inverse_dict['']
+
+    for bit in encoded_message:
         key += bit
         if key in inverse_dict:
             decoded_message.append(inverse_dict[key])

From 7cec66e20c4e635d8b62bf97e18599dcc50cf4b0 Mon Sep 17 00:00:00 2001
From: Amaras <amaras@vivaldi.net>
Date: Thu, 6 Aug 2020 22:01:47 +0200
Subject: [PATCH 4/6] Added edge case support

---
 contents/huffman_encoding/code/coconut/huffman.coco | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/contents/huffman_encoding/code/coconut/huffman.coco b/contents/huffman_encoding/code/coconut/huffman.coco
index 1d4c45657..ebbd5e2b9 100644
--- a/contents/huffman_encoding/code/coconut/huffman.coco
+++ b/contents/huffman_encoding/code/coconut/huffman.coco
@@ -62,6 +62,9 @@ addpattern def build_codebook(Node(left, right), code='') = build_codebook(left,
 # encodes the message
 def huffman_encode(codebook, message):
 
+    if len(codebook) == 1:
+        return '0' * len(message)
+
     # build a char -> code dictionary
     forward_dict = dict(codebook)
 
@@ -75,6 +78,8 @@ def huffman_decode(codebook, encoded_message):
 
     if not codebook:
         return ''
+    elif len(codebook) == 1:
+        return codebook[0][0] * len(encoded_message)
 
     # build a code -> char dictionary
     inverse_dict = dict((v, k) for k, v in codebook)

From 43d4f76582fe5c7fb9d9a84483e71e0440174b7a Mon Sep 17 00:00:00 2001
From: Sammy Plat <amaras@vivaldi.net>
Date: Thu, 9 Sep 2021 15:41:30 +0200
Subject: [PATCH 5/6] Shortened overly long lines

---
 contents/huffman_encoding/code/coconut/huffman.coco | 12 +++++++-----
 1 file changed, 7 insertions(+), 5 deletions(-)

diff --git a/contents/huffman_encoding/code/coconut/huffman.coco b/contents/huffman_encoding/code/coconut/huffman.coco
index ebbd5e2b9..7d13fb307 100644
--- a/contents/huffman_encoding/code/coconut/huffman.coco
+++ b/contents/huffman_encoding/code/coconut/huffman.coco
@@ -44,7 +44,8 @@ def build_huffman_tree(message):
         # combine the nodes and add back to the nodes list
         new_tree = Node(tree_left, tree_right)
 
-        # find the first tree that has a weight smaller than new_weight and returns its index in the list
+        # find the index of the first tree that is heavier than new_tree,
+        # i.e. the position that keeps the list sorted by weight.
         # If no such tree can be found, use len(trees) instead to append
         index = bisect(trees |> map$(weight) |> list, weight(new_tree))
 
@@ -57,7 +58,8 @@ def build_huffman_tree(message):
 
 def build_codebook(Empty(), code='') = []
 addpattern def build_codebook(Leaf(char, n), code='') = [(char, code)]
-addpattern def build_codebook(Node(left, right), code='') = build_codebook(left, code+'0') + build_codebook(right, code+'1')
+addpattern def build_codebook(Node(left, right), code='') = 
+    build_codebook(left, code+'0') + build_codebook(right, code+'1')
 
 # encodes the message
 def huffman_encode(codebook, message):
@@ -85,9 +87,9 @@ def huffman_decode(codebook, encoded_message):
     inverse_dict = dict((v, k) for k, v in codebook)
 
     # for each bit in the encoding
-    # if the bit is in the dictionary, replace the bit with the paired character
-    # else look at the bit and the following bits together until a match occurs
-    # move to the next bit not yet looked at
+    # if the bit is in the dictionary, replace the bit with the paired
+    # character; else look at the bit and the following bits together
+    # until a match occurs, then move to the next bit not yet looked at.
     if encoded_message == '':
         return inverse_dict['']
 

From 90f0c96a8fe7b23e338b499c71a94aeafac1c4fc Mon Sep 17 00:00:00 2001
From: Sammy Plat <amaras@vivaldi.net>
Date: Thu, 9 Sep 2021 16:43:05 +0200
Subject: [PATCH 6/6] removed the useless comments

---
 contents/huffman_encoding/code/coconut/huffman.coco | 8 --------
 1 file changed, 8 deletions(-)

diff --git a/contents/huffman_encoding/code/coconut/huffman.coco b/contents/huffman_encoding/code/coconut/huffman.coco
index 7d13fb307..640112167 100644
--- a/contents/huffman_encoding/code/coconut/huffman.coco
+++ b/contents/huffman_encoding/code/coconut/huffman.coco
@@ -1,8 +1,3 @@
-# Huffman Encoding
-# Coconut
-# Submitted by Amaras
-# Inspired by Matthew Giallourakis
-
 from collections import Counter, deque
 from bisect import bisect
 
@@ -24,7 +19,6 @@ def weight(Tree()) = 0
 addpattern def weight(Leaf(char, n)) = n
 addpattern def weight(Node(left, right)) = weight(left) + weight(right)
 
-# constructs the tree
 def build_huffman_tree(message):
 
     # get sorted list of character and frequency pairs
@@ -61,7 +55,6 @@ addpattern def build_codebook(Leaf(char, n), code='') = [(char, code)]
 addpattern def build_codebook(Node(left, right), code='') = 
     build_codebook(left, code+'0') + build_codebook(right, code+'1')
 
-# encodes the message
 def huffman_encode(codebook, message):
 
     if len(codebook) == 1:
@@ -72,7 +65,6 @@ def huffman_encode(codebook, message):
 
     return ''.join(message |> map$(forward_dict[]))
 
-# decodes a message
 def huffman_decode(codebook, encoded_message):
 
     decoded_message = []