Merge pull request #171 from haskell-jp/hiw2019-gibbons

igrep · web-flow · commit 4aab0f4dc0ad · 2019-09-28T13:44:33.000+09:00
記事の追加: HIW 2019で発表された、Gibbonコンパイラーについて
diff --git a/preprocessed-site/img/2019/hiw-gibbon/tree-and-array1.svg b/preprocessed-site/img/2019/hiw-gibbon/tree-and-array1.svg
@@ -0,0 +1 @@
+<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:lucid="lucid" width="722" height="436"><g transform="translate(-160 -163)" lucid:page-tab-id="0_0"><path d="M540 220c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#a" transform="matrix(1,0,0,1,465,185) translate(29.537 42.754999999999995)"/><path d="M380 400c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#b" transform="matrix(1,0,0,1,305,365) translate(29.087 42.754999999999995)"/><path d="M260 540c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#c" transform="matrix(1,0,0,1,185,505) translate(28.817 42.754999999999995)"/><path d="M460 540c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#d" transform="matrix(1,0,0,1,385,505) translate(29.708 42.754999999999995)"/><path d="M720 400c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#e" transform="matrix(1,0,0,1,645,365) translate(29.258 42.754999999999995)"/><path d="M860 540c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#f" transform="matrix(1,0,0,1,785,505) translate(28.799 42.754999999999995)"/><path d="M660 540c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#g" transform="matrix(1,0,0,1,585,505) translate(30.032 42.754999999999995)"/><path d="M472.2 251.4L366.52 367.54" stroke="#000" stroke-width="2" fill="none"/><path d="M473.64 251.3l-.72.8-1.48-1.34.65-.72zM367.27 368.18l-.65.73-1.55-1.27.72-.8z"/><path d="M312.16 431.38l-71.88 71.88" stroke="#000" stroke-width="2" 
fill="none"/><path d="M313.64 431.3l-.8.8-1.4-1.4.65-.67zM241 503.95l-.55.56-.82-.5-1.02-.48 1-1z"/><path d="M360.8 436.4l38.4 67.2" stroke="#000" stroke-width="2" fill="none"/><path d="M361.68 435.93l-1.73 1-.52-.9 1.75-.98zM400.57 503.97l-1.75.98-.5-.88 1.73-1z"/><path d="M530.7 248.65l120.15 121.22" stroke="#000" stroke-width="2" fill="none"/><path d="M531.44 247.97l-1.42 1.4-.74-.74.73-.7.64-.76zM652.28 369.9l-1.45 1.37-.7-.72 1.4-1.4z"/><path d="M655.38 434l-34.9 64.12" stroke="#000" stroke-width="2" fill="none"/><path d="M656.03 433.27l.66.4-.46.83-1.76-.95.6-1.07zM621.37 498.58l-.27.5-1.1-.08-1.16.04.77-1.42z"/><path d="M713.17 425.65l81.18 81.18" stroke="#000" stroke-width="2" fill="none"/><path d="M713.9 424.96l-1.4 1.42-.67-.66 1.27-1.55zM795.88 506.94l-1.63 1.2-.62-.62 1.4-1.4z"/><defs><path d="M191-298h222c-37-120-75-237-109-360h-4c-33 124-71 241-109 360zM506 0l-70-224H168L97 0H3l249-733h103L604 0h-98" id="h"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#h" id="a"/><path d="M100 0v-733h218c149 0 252 50 252 179 0 73-39 137-108 159v5c88 17 150 75 150 175C612-71 498 0 334 0H100zm93-421h109c126 0 177-47 177-121 0-86-59-118-173-118H193v239zm0 347h128c126 0 200-45 200-144 0-91-72-132-200-132H193v276" id="i"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#i" id="b"/><path d="M100 0v-733h184c225 0 346 131 346 364C630-137 509 0 288 0H100zm93-76h83c173 0 258-108 258-293 0-186-85-289-258-289h-83v582" id="j"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#j" id="c"/><path d="M100 0v-733h423v78H193v230h278v79H193v267h341V0H100" id="k"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#k" id="d"/><path d="M377 13C195 13 58-128 58-366c0-237 139-381 325-381 89 0 159 44 201 91l-50 60c-38-41-87-70-150-70-139 0-231 114-231 297 0 185 88 301 228 301 70 0 123-31 170-82l51 58C544-25 472 13 377 13" id="l"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#l" id="e"/><path d="M388 13C195 13 58-128 58-366c0-237 142-381 336-381 
102 0 169 46 211 91l-50 60c-37-39-84-70-159-70-147 0-243 114-243 297 0 185 87 301 244 301 53 0 104-16 133-43v-192H375v-77h240v308c-47 49-128 85-227 85" id="m"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#m" id="f"/><path d="M100 0v-733h423v78H193v248h280v78H193V0h-93" id="n"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#n" id="g"/></defs></g></svg>
diff --git a/preprocessed-site/img/2019/hiw-gibbon/tree-and-array2.svg b/preprocessed-site/img/2019/hiw-gibbon/tree-and-array2.svg
@@ -0,0 +1 @@
+<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:lucid="lucid" width="732" height="446"><g transform="translate(-166 -636)" lucid:page-tab-id="0_0"><path d="M472 704.04l-98.73 98.7 8.02 8.03-30.46-1.6-1.6-30.46 8 8.03L455.97 688z" stroke="#000" stroke-opacity="0" stroke-width="2" fill="#c92d39" fill-opacity=".85"/><path d="M560 700c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#a" transform="matrix(1,0,0,1,485,665) translate(29.537 42.754999999999995)"/><path d="M400 880c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#b" transform="matrix(1,0,0,1,325,845) translate(29.087 42.754999999999995)"/><path d="M280 1020c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#c" transform="matrix(1,0,0,1,205,985) translate(28.817 42.754999999999995)"/><path d="M480 1020c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#d" transform="matrix(1,0,0,1,405,985) translate(29.708 42.754999999999995)"/><path d="M740 880c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#e" transform="matrix(1,0,0,1,665,845) translate(29.258 42.754999999999995)"/><path d="M880 1020c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#f" transform="matrix(1,0,0,1,805,985) translate(28.799 42.754999999999995)"/><path d="M680 1020c0 22.1-17.9 40-40 40s-40-17.9-40-40 17.9-40 40-40 40 17.9 40 40z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#g" transform="matrix(1,0,0,1,605,985) translate(30.032 42.754999999999995)"/><path d="M492.2 731.4L386.52 847.54" stroke="#000" stroke-width="2" 
fill="none"/><path d="M493.64 731.3l-.72.8-1.48-1.34.65-.72zM387.27 848.18l-.65.73-1.55-1.27.72-.8z"/><path d="M332.16 911.38l-71.88 71.88" stroke="#000" stroke-width="2" fill="none"/><path d="M333.64 911.3l-.8.8-1.4-1.4.65-.67zM261 983.95l-.55.56-.82-.5-1.02-.48 1-1z"/><path d="M380.8 916.4l38.4 67.2" stroke="#000" stroke-width="2" fill="none"/><path d="M381.68 915.93l-1.73 1-.52-.9 1.75-.98zM420.57 983.97l-1.75.98-.5-.88 1.73-1z"/><path d="M550.7 728.65l120.15 121.22" stroke="#000" stroke-width="2" fill="none"/><path d="M551.44 727.97l-1.42 1.4-.74-.74.73-.7.64-.76zM672.28 849.9l-1.45 1.37-.7-.72 1.4-1.4z"/><path d="M675.38 914l-34.9 64.12" stroke="#000" stroke-width="2" fill="none"/><path d="M676.03 913.27l.66.4-.46.83-1.76-.95.6-1.07zM641.37 978.58l-.27.5-1.1-.08-1.16.04.77-1.42z"/><path d="M733.17 905.65l81.18 81.18" stroke="#000" stroke-width="2" fill="none"/><path d="M733.9 904.96l-1.4 1.42-.67-.66 1.27-1.55zM815.88 986.94l-1.63 1.2-.62-.62 1.4-1.4z"/><path d="M304.58 864.04l-98.7 98.7 8 8.03-30.45-1.6-1.6-30.46 8 8.03L288.56 848zM295 1008.67h69.6v-11.34L385 1020l-20.4 22.67v-11.34H295zM489.95 980.08l136.72-79.6-5.7-9.8L650 900l-6.22 29.85-5.7-9.8-136.73 79.62zM700 1008.67h69.6v-11.34L790 1020l-20.4 22.67v-11.34H700zM714.12 937.17l-14.62 30 10.2 4.96-29.33 8.4-11.43-28.27 10.2 4.97 14.6-30z" stroke="#000" stroke-opacity="0" stroke-width="2" fill="#c92d39" fill-opacity=".85"/><defs><path d="M191-298h222c-37-120-75-237-109-360h-4c-33 124-71 241-109 360zM506 0l-70-224H168L97 0H3l249-733h103L604 0h-98" id="h"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#h" id="a"/><path d="M100 0v-733h218c149 0 252 50 252 179 0 73-39 137-108 159v5c88 17 150 75 150 175C612-71 498 0 334 0H100zm93-421h109c126 0 177-47 177-121 0-86-59-118-173-118H193v239zm0 347h128c126 0 200-45 200-144 0-91-72-132-200-132H193v276" id="i"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#i" id="b"/><path d="M100 0v-733h184c225 0 346 131 346 364C630-137 509 0 288 
0H100zm93-76h83c173 0 258-108 258-293 0-186-85-289-258-289h-83v582" id="j"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#j" id="c"/><path d="M100 0v-733h423v78H193v230h278v79H193v267h341V0H100" id="k"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#k" id="d"/><path d="M377 13C195 13 58-128 58-366c0-237 139-381 325-381 89 0 159 44 201 91l-50 60c-38-41-87-70-150-70-139 0-231 114-231 297 0 185 88 301 228 301 70 0 123-31 170-82l51 58C544-25 472 13 377 13" id="l"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#l" id="e"/><path d="M388 13C195 13 58-128 58-366c0-237 142-381 336-381 102 0 169 46 211 91l-50 60c-37-39-84-70-159-70-147 0-243 114-243 297 0 185 87 301 244 301 53 0 104-16 133-43v-192H375v-77h240v308c-47 49-128 85-227 85" id="m"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#m" id="f"/><path d="M100 0v-733h423v78H193v248h280v78H193V0h-93" id="n"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#n" id="g"/></defs></g></svg>
diff --git a/preprocessed-site/img/2019/hiw-gibbon/tree-and-array3.svg b/preprocessed-site/img/2019/hiw-gibbon/tree-and-array3.svg
@@ -0,0 +1 @@
+<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:lucid="lucid" width="615" height="122"><g transform="translate(-143 -1096)" lucid:page-tab-id="0_0"><path d="M167.4 1120h80v80h-80z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#a" transform="matrix(1,0,0,1,172.4037037981907,1125) translate(29.537 42.754999999999995)"/><path d="M247.4 1120h80v80h-80z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#b" transform="matrix(1,0,0,1,252.4037037981907,1125) translate(29.087 42.754999999999995)"/><path d="M327.4 1120h80v80h-80z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#c" transform="matrix(1,0,0,1,332.40370379818114,1125) translate(28.817 42.754999999999995)"/><path d="M407.4 1120h80v80h-80z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#d" transform="matrix(1,0,0,1,412.4037037981716,1125) translate(29.708 42.754999999999995)"/><path d="M487.4 1120h80v80h-80z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#e" transform="matrix(1,0,0,1,492.40370379816204,1125) translate(29.258 42.754999999999995)"/><path d="M567.4 1120h80v80h-80z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#f" transform="matrix(1,0,0,1,572.4037037981525,1125) translate(30.032 42.754999999999995)"/><path d="M647.4 1120h80v80h-80z" stroke="#000" stroke-width="2" fill="#fff"/><use xlink:href="#g" transform="matrix(1,0,0,1,652.4037037981429,1125) translate(28.799 42.754999999999995)"/><defs><path d="M191-298h222c-37-120-75-237-109-360h-4c-33 124-71 241-109 360zM506 0l-70-224H168L97 0H3l249-733h103L604 0h-98" id="h"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#h" id="a"/><path d="M100 0v-733h218c149 0 252 50 252 179 0 73-39 137-108 159v5c88 17 150 75 150 175C612-71 498 0 334 0H100zm93-421h109c126 0 177-47 177-121 0-86-59-118-173-118H193v239zm0 347h128c126 0 200-45 200-144 0-91-72-132-200-132H193v276" id="i"/><use transform="matrix(0.018,0,0,0.018,0,0)" 
xlink:href="#i" id="b"/><path d="M100 0v-733h184c225 0 346 131 346 364C630-137 509 0 288 0H100zm93-76h83c173 0 258-108 258-293 0-186-85-289-258-289h-83v582" id="j"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#j" id="c"/><path d="M100 0v-733h423v78H193v230h278v79H193v267h341V0H100" id="k"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#k" id="d"/><path d="M377 13C195 13 58-128 58-366c0-237 139-381 325-381 89 0 159 44 201 91l-50 60c-38-41-87-70-150-70-139 0-231 114-231 297 0 185 88 301 228 301 70 0 123-31 170-82l51 58C544-25 472 13 377 13" id="l"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#l" id="e"/><path d="M100 0v-733h423v78H193v248h280v78H193V0h-93" id="m"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#m" id="f"/><path d="M388 13C195 13 58-128 58-366c0-237 142-381 336-381 102 0 169 46 211 91l-50 60c-37-39-84-70-159-70-147 0-243 114-243 297 0 185 87 301 244 301 53 0 104-16 133-43v-192H375v-77h240v308c-47 49-128 85-227 85" id="n"/><use transform="matrix(0.018,0,0,0.018,0,0)" xlink:href="#n" id="g"/></defs></g></svg>
diff --git a/preprocessed-site/posts/2019/hiw-gibbon.md b/preprocessed-site/posts/2019/hiw-gibbon.md
@@ -0,0 +1,93 @@
+---
+title: HIW 2019で発表された、Gibbonコンパイラーについて
+subHeading: ～HIW 2019参加レポート その3～
+headingBackgroundImage: ../../img/background.png
+headingDivClass: post-heading
+author: Yuji Yamamoto
+postedBy: <a href="http://the.igreque.info/">Yuji Yamamoto(@igrep)</a>
+date: September 28, 2019
+tags: Haskell Implementors' Workshop
+...
+---
+
+[前回](/posts/2019/hiw-ghc-future.html)から引き続き、[Haskell Implementors' Workshop 2019](https://icfp19.sigplan.org/home/hiw-2019#About)への参加レポートとして、私の印象に残った発表を紹介します。  
+今回は、[Gibbon](http://iu-parfunc.github.io/gibbon/)という、GHC以外のHaskell<small>（の、サブセット）</small>の処理系についての発表です。
+
+# The Gibbon Compiler: Accelerating a small subset of Haskell
+
+発表者: Ryan R. Newton *Indiana University*, Michael Vollmer *Indiana University, USA*, Chaitanya Koparkar *Indiana University*
+
+Gibbonは最適化の手法を研究するために作られたコンパイラーです。  
+具体的には、我々<small>（特にHaskeller）</small>がよく使う、木構造全体に対する処理の最適化です。
+
+こうした木構造のデータは、通常ポインターを使ってメモリー内にバラバラに格納されます。Gibbonは、プログラムが実際にどのような順番で木を処理しているのかを解析し、元のデータ構造をその順番に要素が並んだ配列に変換した上で、その配列を処理するコードに書き換える、という大胆な最適化を行います。
+図にするとこんなイメージでしょうか？
+
+![変換前の木構造。各ノードがそれぞれ（レベル順で）A, B, ... , Gという値を持っている](/img/2019/hiw-gibbon/tree-and-array1.svg)
+
+👆のような木構造があったとして、
+
+![行きがけ順（A, B, D, E, C, F, Gの順）でアクセスする](/img/2019/hiw-gibbon/tree-and-array2.svg)
+
+👆における、赤い線の順番<small>（行きがけ順）</small>にアクセスする関数があったとします。  
+適当にHaskellの再帰関数として書くと、👇こういうコードです。
+
+```haskell
+data Tree = Node Char (Maybe Tree) (Maybe Tree) deriving Show
+
+tree :: Tree
+tree =
+  Node 'A'
+    ( Just
+      ( Node 'B'
+        (Just (Node 'D' Nothing Nothing))
+        (Just (Node 'E' Nothing Nothing))
+      )
+    )
+    ( Just
+      ( Node 'C'
+        (Just (Node 'F' Nothing Nothing))
+        (Just (Node 'G' Nothing Nothing))
+      )
+    )
+
+preOrder :: (Char -> IO ()) -> Tree -> IO ()
+preOrder access (Node char mLeft mRight) = do
+  access char
+
+  case mLeft of
+    Just left -> preOrder access left
+    Nothing -> return ()
+
+  case mRight of
+    Just right -> preOrder access right
+    Nothing -> return ()
+```
+
+Gibbonはこの関数と、それが処理する木構造を解析して、
+
+![変換された配列。A, B, D, E, C, F, Gの順に要素が並んだただの配列](/img/2019/hiw-gibbon/tree-and-array3.svg)
+
+👆のような、ただの配列（とそれに対する関数）にまとめて変換してしまう、というのです！
+
+現代のコンピューターでは、このような配列の要素にまとめてアクセスして処理する方が、ポインターをたどって各要素を処理するより、たいてい遙かに高速です。  
+Gibbonはこの特性を活かすべく、我々Haskellerが好んで使うような、ポインターだらけの木構造を可能な限り配列に変換することで、要素をまとめて処理する（traverseする）演算の最適化を図るコンパイラーです。
+
+ちなみに、元の木に対するノードの追加に相当する処理は、新しいノードに対するポインターを書き込む処理に変換するそうです。  
+なので何度も追加を繰り返すと、あまり恩恵が受けられなくなってしまいそうです。
+
+なかなか興味深いアイディアですが、個人的に聞きそびれた疑問が2つあります。  
+一つは、そもそも木構造を定義するような状況というのは、いろいろな順番でアクセスしたいし、新しい要素の追加も繰り返し行いたいケースではないでしょうか？  
+例えば[unordered-containers](http://hackage.haskell.org/package/unordered-containers)にある`HashMap`型は、探索木を使って実装された、頻繁に使われるデータ構造ですが、`HashMap`を使う場合に行う処理の多くは、ランダムアクセスや要素の追加・削除でしょう。
+
+なので、Gibbonが最適化したい「木構造」というのは、どちらかというと探索木のような木ではなく、構文木のような、要素をまとめて処理することを前提とした木のことなのかもしれません。  
+確かに人間が書く言語の構文木程度であれば、すべてメモリー上で処理できる程度のサイズに収まる<small>（という想定でなければコンパイラー作りがものすごく難しくなる）</small>でしょうし、構文木の処理を高速化できれば、遅い遅いと言われるGHCのコンパイル速度も高められるはずです。それはそれでありがたい。
+
+もう一つは、これまた例えば`HashMap`型のような木をベースにした連想配列も、配列ベースのハッシュテーブルに変換することができるのでしょうか？  
+もしそうだとすると、ランダムアクセスに対する計算量のオーダーもO(log n)からO(1)に変わるわけですし、要素をまとめて処理する以外の演算についても劇的な改善が見込めるかもしれません。  
+もちろんこれも先ほどの推測が正しければ無意味な想像ですが、夢のある話ですね。
+
+Gibbonは将来的には、`Packed`という型クラスを提供することで、GHC本体への統合も視野に入れているそうです。  
+`Packed`のインスタンスにした型については、値をどのように配列に変換するのかを定義することで、Gibbonによる最適化のためのヒントを与えられます。
+
+参考: [木構造 (データ構造) - Wikipedia](https://ja.wikipedia.org/w/index.php?title=%E6%9C%A8%E6%A7%8B%E9%80%A0_\(%E3%83%87%E3%83%BC%E3%82%BF%E6%A7%8B%E9%80%A0\)&oldid=72655479)