[PATCH 2/6] Squashfs: enhance parallel I/O

2013-11-07 Thread Phillip Lougher
From: Minchan Kim 

Now squashfs have used for only one stream buffer for decompression
so it hurts parallel read performance so this patch supports
multiple decompressor to enhance performance parallel I/O.

Four 1G file dd read on KVM machine which has 2 CPU and 4G memory.

dd if=test/test1.dat of=/dev/null &
dd if=test/test2.dat of=/dev/null &
dd if=test/test3.dat of=/dev/null &
dd if=test/test4.dat of=/dev/null &

old : 1m39s -> new : 9s

* From v1
  * Change comp_strm with decomp_strm - Phillip
  * Change/add comments - Phillip

Signed-off-by: Minchan Kim 
Signed-off-by: Phillip Lougher 
---
 fs/squashfs/Kconfig  |   13 +++
 fs/squashfs/Makefile |9 +-
 fs/squashfs/decompressor_multi.c |  200 ++
 3 files changed, 221 insertions(+), 1 deletion(-)
 create mode 100644 fs/squashfs/decompressor_multi.c

diff --git a/fs/squashfs/Kconfig b/fs/squashfs/Kconfig
index c70111e..1c6d340 100644
--- a/fs/squashfs/Kconfig
+++ b/fs/squashfs/Kconfig
@@ -63,6 +63,19 @@ config SQUASHFS_LZO
 
  If unsure, say N.
 
+config SQUASHFS_MULTI_DECOMPRESSOR
+   bool "Use multiple decompressors for handling parallel I/O"
+   depends on SQUASHFS
+   help
+ By default Squashfs uses a single decompressor but it gives
+ poor performance on parallel I/O workloads when using multiple CPU
+ machines due to waiting on decompressor availability.
+
+ If you have a parallel I/O workload and your system has enough memory,
+ using this option may improve overall I/O performance.
+
+ If unsure, say N.
+
 config SQUASHFS_XZ
bool "Include support for XZ compressed file systems"
depends on SQUASHFS
diff --git a/fs/squashfs/Makefile b/fs/squashfs/Makefile
index c223c84..dfebc3b 100644
--- a/fs/squashfs/Makefile
+++ b/fs/squashfs/Makefile
@@ -4,8 +4,15 @@
 
 obj-$(CONFIG_SQUASHFS) += squashfs.o
 squashfs-y += block.o cache.o dir.o export.o file.o fragment.o id.o inode.o
-squashfs-y += namei.o super.o symlink.o decompressor.o decompressor_single.o
+squashfs-y += namei.o super.o symlink.o decompressor.o
+
 squashfs-$(CONFIG_SQUASHFS_XATTR) += xattr.o xattr_id.o
 squashfs-$(CONFIG_SQUASHFS_LZO) += lzo_wrapper.o
 squashfs-$(CONFIG_SQUASHFS_XZ) += xz_wrapper.o
 squashfs-$(CONFIG_SQUASHFS_ZLIB) += zlib_wrapper.o
+
+ifdef CONFIG_SQUASHFS_MULTI_DECOMPRESSOR
+   squashfs-y  += decompressor_multi.o
+else
+   squashfs-y  += decompressor_single.o
+endif
diff --git a/fs/squashfs/decompressor_multi.c b/fs/squashfs/decompressor_multi.c
new file mode 100644
index 000..462731d
--- /dev/null
+++ b/fs/squashfs/decompressor_multi.c
@@ -0,0 +1,200 @@
+/*
+ *  Copyright (c) 2013
+ *  Minchan Kim 
+ *
+ *  This work is licensed under the terms of the GNU GPL, version 2. See
+ *  the COPYING file in the top-level directory.
+ */
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+#include 
+
+#include "squashfs_fs.h"
+#include "squashfs_fs_sb.h"
+#include "decompressor.h"
+#include "squashfs.h"
+
+/*
+ * This file implements multi-threaded decompression in the
+ * decompressor framework
+ */
+
+
+/*
+ * The reason that multiply two is that a CPU can request new I/O
+ * while it is waiting previous request.
+ */
+#define MAX_DECOMPRESSOR   (num_online_cpus() * 2)
+
+
+int squashfs_max_decompressors(void)
+{
+   return MAX_DECOMPRESSOR;
+}
+
+
+struct squashfs_stream {
+   void*comp_opts;
+   struct list_headstrm_list;
+   struct mutexmutex;
+   int avail_decomp;
+   wait_queue_head_t   wait;
+};
+
+
+struct decomp_stream {
+   void *stream;
+   struct list_head list;
+};
+
+
+static void put_decomp_stream(struct decomp_stream *decomp_strm,
+   struct squashfs_stream *stream)
+{
+   mutex_lock(>mutex);
+   list_add(_strm->list, >strm_list);
+   mutex_unlock(>mutex);
+   wake_up(>wait);
+}
+
+void *squashfs_decompressor_create(struct squashfs_sb_info *msblk,
+   void *comp_opts)
+{
+   struct squashfs_stream *stream;
+   struct decomp_stream *decomp_strm = NULL;
+   int err = -ENOMEM;
+
+   stream = kzalloc(sizeof(*stream), GFP_KERNEL);
+   if (!stream)
+   goto out;
+
+   stream->comp_opts = comp_opts;
+   mutex_init(>mutex);
+   INIT_LIST_HEAD(>strm_list);
+   init_waitqueue_head(>wait);
+
+   /*
+* We should have a decompressor at least as default
+* so if we fail to allocate new decompressor dynamically,
+* we could always fall back to default decompressor and
+* file system works.
+*/
+   decomp_strm = kmalloc(sizeof(*decomp_strm), GFP_KERNEL);
+   if (!decomp_strm)
+   goto out;
+
+   decomp_strm->stream = msblk->decompressor->init(msblk,
+   

[PATCH 2/6] Squashfs: enhance parallel I/O

2013-11-07 Thread Phillip Lougher
From: Minchan Kim minc...@kernel.org

Now squashfs have used for only one stream buffer for decompression
so it hurts parallel read performance so this patch supports
multiple decompressor to enhance performance parallel I/O.

Four 1G file dd read on KVM machine which has 2 CPU and 4G memory.

dd if=test/test1.dat of=/dev/null 
dd if=test/test2.dat of=/dev/null 
dd if=test/test3.dat of=/dev/null 
dd if=test/test4.dat of=/dev/null 

old : 1m39s - new : 9s

* From v1
  * Change comp_strm with decomp_strm - Phillip
  * Change/add comments - Phillip

Signed-off-by: Minchan Kim minc...@kernel.org
Signed-off-by: Phillip Lougher phil...@squashfs.org.uk
---
 fs/squashfs/Kconfig  |   13 +++
 fs/squashfs/Makefile |9 +-
 fs/squashfs/decompressor_multi.c |  200 ++
 3 files changed, 221 insertions(+), 1 deletion(-)
 create mode 100644 fs/squashfs/decompressor_multi.c

diff --git a/fs/squashfs/Kconfig b/fs/squashfs/Kconfig
index c70111e..1c6d340 100644
--- a/fs/squashfs/Kconfig
+++ b/fs/squashfs/Kconfig
@@ -63,6 +63,19 @@ config SQUASHFS_LZO
 
  If unsure, say N.
 
+config SQUASHFS_MULTI_DECOMPRESSOR
+   bool Use multiple decompressors for handling parallel I/O
+   depends on SQUASHFS
+   help
+ By default Squashfs uses a single decompressor but it gives
+ poor performance on parallel I/O workloads when using multiple CPU
+ machines due to waiting on decompressor availability.
+
+ If you have a parallel I/O workload and your system has enough memory,
+ using this option may improve overall I/O performance.
+
+ If unsure, say N.
+
 config SQUASHFS_XZ
bool Include support for XZ compressed file systems
depends on SQUASHFS
diff --git a/fs/squashfs/Makefile b/fs/squashfs/Makefile
index c223c84..dfebc3b 100644
--- a/fs/squashfs/Makefile
+++ b/fs/squashfs/Makefile
@@ -4,8 +4,15 @@
 
 obj-$(CONFIG_SQUASHFS) += squashfs.o
 squashfs-y += block.o cache.o dir.o export.o file.o fragment.o id.o inode.o
-squashfs-y += namei.o super.o symlink.o decompressor.o decompressor_single.o
+squashfs-y += namei.o super.o symlink.o decompressor.o
+
 squashfs-$(CONFIG_SQUASHFS_XATTR) += xattr.o xattr_id.o
 squashfs-$(CONFIG_SQUASHFS_LZO) += lzo_wrapper.o
 squashfs-$(CONFIG_SQUASHFS_XZ) += xz_wrapper.o
 squashfs-$(CONFIG_SQUASHFS_ZLIB) += zlib_wrapper.o
+
+ifdef CONFIG_SQUASHFS_MULTI_DECOMPRESSOR
+   squashfs-y  += decompressor_multi.o
+else
+   squashfs-y  += decompressor_single.o
+endif
diff --git a/fs/squashfs/decompressor_multi.c b/fs/squashfs/decompressor_multi.c
new file mode 100644
index 000..462731d
--- /dev/null
+++ b/fs/squashfs/decompressor_multi.c
@@ -0,0 +1,200 @@
+/*
+ *  Copyright (c) 2013
+ *  Minchan Kim minc...@kernel.org
+ *
+ *  This work is licensed under the terms of the GNU GPL, version 2. See
+ *  the COPYING file in the top-level directory.
+ */
+#include linux/types.h
+#include linux/mutex.h
+#include linux/slab.h
+#include linux/buffer_head.h
+#include linux/sched.h
+#include linux/wait.h
+#include linux/cpumask.h
+
+#include squashfs_fs.h
+#include squashfs_fs_sb.h
+#include decompressor.h
+#include squashfs.h
+
+/*
+ * This file implements multi-threaded decompression in the
+ * decompressor framework
+ */
+
+
+/*
+ * The reason that multiply two is that a CPU can request new I/O
+ * while it is waiting previous request.
+ */
+#define MAX_DECOMPRESSOR   (num_online_cpus() * 2)
+
+
+int squashfs_max_decompressors(void)
+{
+   return MAX_DECOMPRESSOR;
+}
+
+
+struct squashfs_stream {
+   void*comp_opts;
+   struct list_headstrm_list;
+   struct mutexmutex;
+   int avail_decomp;
+   wait_queue_head_t   wait;
+};
+
+
+struct decomp_stream {
+   void *stream;
+   struct list_head list;
+};
+
+
+static void put_decomp_stream(struct decomp_stream *decomp_strm,
+   struct squashfs_stream *stream)
+{
+   mutex_lock(stream-mutex);
+   list_add(decomp_strm-list, stream-strm_list);
+   mutex_unlock(stream-mutex);
+   wake_up(stream-wait);
+}
+
+void *squashfs_decompressor_create(struct squashfs_sb_info *msblk,
+   void *comp_opts)
+{
+   struct squashfs_stream *stream;
+   struct decomp_stream *decomp_strm = NULL;
+   int err = -ENOMEM;
+
+   stream = kzalloc(sizeof(*stream), GFP_KERNEL);
+   if (!stream)
+   goto out;
+
+   stream-comp_opts = comp_opts;
+   mutex_init(stream-mutex);
+   INIT_LIST_HEAD(stream-strm_list);
+   init_waitqueue_head(stream-wait);
+
+   /*
+* We should have a decompressor at least as default
+* so if we fail to allocate new decompressor dynamically,
+* we could always fall back to default decompressor and
+* file system works.
+*/
+   decomp_strm =