# HG changeset patch # User Yuhi TOMARI # Date 1424080144 -32400 # Node ID 14478d9ce501e4ca62813dc3d3b39345bdc1f547 # Parent 9334c3e08e49200f03635063c02e843903b2cd45 fix diff -r 9334c3e08e49 -r 14478d9ce501 paper/master_paper.aux --- a/paper/master_paper.aux Mon Feb 16 18:47:47 2015 +0900 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,153 +0,0 @@ -\relax -\@writefile{toc}{\contentsline {chapter}{\numberline {第1章}マルチプラットフォームなフレームワークにおける並列プログラミング}{1}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {chapter}{\numberline {第2章}既存のマルチプラットフォームフレームワーク}{3}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {2.1}GPU/Cell の Architecture}{3}} -\newlabel{sec:shared_memory}{{2.1}{3}} -\@writefile{lof}{\contentsline {figure}{\numberline {2.1}{\ignorespaces GPU Architecture}}{4}} -\newlabel{fig:gpuarch}{{2.1}{4}} -\@writefile{lof}{\contentsline {figure}{\numberline {2.2}{\ignorespaces CPU Architecture}}{4}} -\newlabel{fig:cpuarch}{{2.2}{4}} -\@writefile{lof}{\contentsline {figure}{\numberline {2.3}{\ignorespaces Cell Architecture}}{5}} -\newlabel{fig:cell_arch}{{2.3}{5}} -\@writefile{toc}{\contentsline {section}{\numberline {2.2}OpenCL}{5}} -\@writefile{toc}{\contentsline {section}{\numberline {2.3}CUDA}{6}} -\@writefile{toc}{\contentsline {section}{\numberline {2.4}StarPU}{6}} -\newlabel{src:codelet}{{2.1}{7}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {2.1}codeletの例}{7}} -\@writefile{toc}{\contentsline {section}{\numberline {2.5}Cell Broadband Engine}{7}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第3章}並列プログラミングフレームワーク Cerium}{8}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {3.1}Cerium の概要}{8}} -\@writefile{toc}{\contentsline {section}{\numberline {3.2}Cerium TaskManager}{8}} -\newlabel{src:createTask}{{3.1}{8}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {3.1}Task の生成}{8}} -\@writefile{lot}{\contentsline {table}{\numberline {3.1}{\ignorespaces Task 生成おける API}}{9}} -\newlabel{table:task_create_api}{{3.1}{9}} -\newlabel{src:task}{{3.2}{9}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {3.2}Task}{9}} -\@writefile{lot}{\contentsline {table}{\numberline {3.2}{\ignorespaces Task 側で使用する API}}{9}} -\newlabel{table:task_api}{{3.2}{9}} -\@writefile{toc}{\contentsline {section}{\numberline {3.3}Cerium における Task}{10}} -\@writefile{lof}{\contentsline {figure}{\numberline {3.1}{\ignorespaces Task Manager}}{10}} -\newlabel{fig:taskmanager}{{3.1}{10}} -\@writefile{toc}{\contentsline {section}{\numberline {3.4}Task の Scheduling}{11}} -\@writefile{lof}{\contentsline {figure}{\numberline {3.2}{\ignorespaces Scheduler}}{11}} -\newlabel{fig:scheduler}{{3.2}{11}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第4章}Ceriumを用いた例題}{12}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {4.1}Bitonic Sort}{12}} -\@writefile{lof}{\contentsline {figure}{\numberline {4.1}{\ignorespaces Bitonic Sort の例}}{13}} -\newlabel{fig:sort}{{4.1}{13}} -\@writefile{toc}{\contentsline {section}{\numberline {4.2}Word Count}{14}} -\@writefile{lof}{\contentsline {figure}{\numberline {4.2}{\ignorespaces WordCountのフロー}}{15}} -\newlabel{fig:wordcount}{{4.2}{15}} -\@writefile{toc}{\contentsline {section}{\numberline {4.3}FFT}{16}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第5章}マルチコアへの対応}{17}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {5.1}マルチコア上での実行の機構}{17}} -\@writefile{toc}{\contentsline {section}{\numberline {5.2}DMA}{17}} -\@writefile{toc}{\contentsline {section}{\numberline {5.3}データ並列}{17}} -\newlabel{sec:multicore_dataparallel}{{5.3}{17}} -\@writefile{lot}{\contentsline {table}{\numberline {5.1}{\ignorespaces データ並列実行時の index の割り当て}}{18}} -\newlabel{table:dataparallel_index}{{5.1}{18}} -\newlabel{src:multiply_cpu}{{5.1}{18}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {5.1}Multiply(CPU)}{18}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第6章}GPGPU への対応}{20}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {6.1}OpenCL および CUDA による実装}{20}} -\@writefile{toc}{\contentsline {section}{\numberline {6.2}データ並列}{21}} -\newlabel{src:multiply_opencl}{{6.1}{21}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {6.1}Multiply(OpenCL)}{21}} -\newlabel{src:multiply_cuda}{{6.2}{21}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {6.2}Multiply(CUDA)}{21}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第7章}並列処理向けI/O}{23}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {7.1}mmap}{23}} -\@writefile{lof}{\contentsline {figure}{\numberline {7.1}{\ignorespaces mmap の Model}}{23}} -\newlabel{fig:mmap}{{7.1}{23}} -\@writefile{toc}{\contentsline {section}{\numberline {7.2}Blocked Read による I/O の並列化}{24}} -\@writefile{lof}{\contentsline {figure}{\numberline {7.2}{\ignorespaces BlockedRead による WordCount}}{24}} -\newlabel{fig:blockedread}{{7.2}{24}} -\newlabel{src:blockedread_create}{{7.1}{25}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {7.1}BlockedRead を行う Task の生成}{25}} -\newlabel{src:blockedread_task}{{7.2}{25}} -\@writefile{lol}{\contentsline {lstlisting}{\numberline {7.2}BlockedRead Task}{25}} -\@writefile{toc}{\contentsline {section}{\numberline {7.3}I/O 専用 Thread の実装}{26}} -\newlabel{sec:spe_problem}{{7.3}{26}} -\@writefile{lof}{\contentsline {figure}{\numberline {7.3}{\ignorespaces BlockedRead と Task を同じ thread で動かした場合}}{26}} -\newlabel{fig:spe_any_blockedread}{{7.3}{26}} -\@writefile{lof}{\contentsline {figure}{\numberline {7.4}{\ignorespaces IO Thread による BlockedRead}}{26}} -\newlabel{fig:iothread__blockedread}{{7.4}{26}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第8章}ベンチマーク}{27}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {8.1}実験環境}{27}} -\@writefile{lot}{\contentsline {table}{\numberline {8.1}{\ignorespaces Ceriumを実行する実験環境1}}{27}} -\newlabel{tab:firefly_spec}{{8.1}{27}} -\@writefile{lot}{\contentsline {table}{\numberline {8.2}{\ignorespaces Ceriumを実行する実験環境2}}{27}} -\newlabel{tab:dragonfly_spec}{{8.2}{27}} -\@writefile{toc}{\contentsline {section}{\numberline {8.2}マルチコア}{28}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.1}{\ignorespaces マルチコア CPU における Sort}}{28}} -\newlabel{fig:sort_on_multicore}{{8.1}{28}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.2}{\ignorespaces マルチコア CPU における WordCount}}{29}} -\newlabel{fig:wordcount_on_multicore}{{8.2}{29}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.3}{\ignorespaces Word Count による prefetch機能のベンチマーク}}{29}} -\newlabel{fig:prefetch_bench}{{8.3}{29}} -\@writefile{toc}{\contentsline {section}{\numberline {8.3}GPGPU}{30}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.4}{\ignorespaces Word Count によるデータ並列実行のベンチマーク}}{30}} -\newlabel{fig:dataparallel}{{8.4}{30}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.5}{\ignorespaces マルチコア CPU、OpenCL、CUDA における FFT}}{31}} -\newlabel{fig:fft_bench}{{8.5}{31}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.6}{\ignorespaces MacPro 2013 における FFT}}{32}} -\newlabel{fig:fft_bench_dragonfly}{{8.6}{32}} -\@writefile{toc}{\contentsline {section}{\numberline {8.4}並列 I/O}{32}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.7}{\ignorespaces WordCount によるファイル読み込み方式のベンチマーク(MacPro2010)}}{33}} -\newlabel{fig:io_bench_firefly}{{8.7}{33}} -\@writefile{lof}{\contentsline {figure}{\numberline {8.8}{\ignorespaces WordCount によるファイル読み込み方式のベンチマーク(MacPro2013)}}{33}} -\newlabel{fig:io_bench_dragonfly}{{8.8}{33}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第9章}既存のプログラミングフレームワークとの比較}{35}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\@writefile{toc}{\contentsline {section}{\numberline {9.1}OpenCL}{35}} -\@writefile{lof}{\contentsline {figure}{\numberline {9.1}{\ignorespaces WorkItem ID}}{36}} -\newlabel{fig:workitem_id}{{9.1}{36}} -\@writefile{lot}{\contentsline {table}{\numberline {9.1}{\ignorespaces kernel で使用する ID 取得の API}}{36}} -\newlabel{table:kernel_id_api}{{9.1}{36}} -\@writefile{toc}{\contentsline {section}{\numberline {9.2}CUDA}{36}} -\@writefile{lof}{\contentsline {figure}{\numberline {9.2}{\ignorespaces Calculate Index example}}{37}} -\newlabel{fig:calculateIndex}{{9.2}{37}} -\@writefile{toc}{\contentsline {section}{\numberline {9.3}StarPU}{37}} -\@writefile{lof}{\contentsline {figure}{\numberline {9.3}{\ignorespaces StarPUにおけるデータ分割}}{38}} -\newlabel{fig:data_partition}{{9.3}{38}} -\@writefile{toc}{\contentsline {chapter}{\numberline {第10章}結論}{39}} -\@writefile{lof}{\addvspace {10\p@ }} -\@writefile{lot}{\addvspace {10\p@ }} -\newlabel{chapter:conclusion}{{10}{39}} -\@writefile{toc}{\contentsline {section}{\numberline {10.1}まとめ}{39}} -\@writefile{toc}{\contentsline {section}{\numberline {10.2}今後の課題}{40}} -\citation{*} -\bibstyle{junsrt} -\bibdata{master_paper} -\@writefile{toc}{\contentsline {chapter}{謝辞}{41}} -\bibcite{yutaka:2012a}{1} -\bibcite{daichi:2012a}{2} -\bibcite{yuhi:2013a}{3} -\bibcite{yuhi:2014a}{4} -\bibcite{kkb:2014a}{5} -\bibcite{masa:2014a}{6} -\bibcite{fft}{7} -\bibcite{cell}{8} -\bibcite{opencl}{9} -\bibcite{starpu}{10} -\bibcite{cuda}{11} -\@writefile{toc}{\contentsline {chapter}{参考文献}{42}} -\@writefile{toc}{\contentsline {chapter}{発表文献}{43}}