From: Stephen Rothwell <sfr@canb.auug.org.au>
Date: Tue, 27 Sep 2011 06:28:30 +0000 (+1000)
Subject: Merge remote-tracking branch 'moduleh/module.h-split'
X-Git-Tag: next-20110927~3
X-Git-Url: https://git.karo-electronics.de/?a=commitdiff_plain;h=19605f333e751ac43727179f5d9ccfadfd7805bb;p=karo-tx-linux.git

Merge remote-tracking branch 'moduleh/module.h-split'

Conflicts:
	arch/arm/mach-bcmring/mm.c
	arch/powerpc/mm/tlb_nohash.c
	drivers/media/dvb/frontends/dibx000_common.c
	drivers/mfd/ab3550-core.c
	drivers/mmc/host/sdhci-pci.c
	drivers/s390/char/vmur.c
	drivers/scsi/libfc/fc_lport.c
	include/linux/dmaengine.h
---

19605f333e751ac43727179f5d9ccfadfd7805bb
diff --cc arch/arm/common/scoop.c
index 1cde34a080d7,f749e60639ee..3229323eeb57
--- a/arch/arm/common/scoop.c
+++ b/arch/arm/common/scoop.c
@@@ -11,8 -11,8 +11,9 @@@
  *
  */
+ #include
 #include
+#include
 #include
 #include
 #include
diff --cc arch/arm/mach-bcmring/mm.c
index 8616876abb9f,293b6d3e0d1d..1adec78ec940
--- a/arch/arm/mach-bcmring/mm.c
+++ b/arch/arm/mach-bcmring/mm.c
@@@ -13,7 -13,7 +13,8 @@@
  *****************************************************************************/
 #include
+#include
+ #include
 #include
 #include
diff --cc arch/arm/mach-omap2/voltage.c
index 64070ac1e761,e964cfd3a3d0..1f8fdf736e63
--- a/arch/arm/mach-omap2/voltage.c
+++ b/arch/arm/mach-omap2/voltage.c
@@@ -21,10 -21,11 +21,11 @@@
 #include
 #include
-#include
 #include
+ #include
 #include
 #include
+#include
 #include
diff --cc arch/mips/bcm47xx/setup.c
index 17c3d14d7c49,0eda3808ee9d..6084dc24b18c
--- a/arch/mips/bcm47xx/setup.c
+++ b/arch/mips/bcm47xx/setup.c
@@@ -27,9 -27,9 +27,10 @@@
  */
 #include
+ #include
 #include
 #include
+#include
 #include
 #include
 #include
diff --cc arch/powerpc/mm/tlb_nohash.c
index afc95c7304ae,ab06aea8a163..f2762556e5ef
--- a/arch/powerpc/mm/tlb_nohash.c
+++ b/arch/powerpc/mm/tlb_nohash.c
@@@ -36,7 -36,7 +36,8 @@@
 #include
 #include
 #include
+#include
+ #include
 #include
 #include
diff --cc arch/x86/crypto/aes_glue.c
index b0b6950cc8c8,bdce3eeeaa37..8efcf42a9d7e
--- a/arch/x86/crypto/aes_glue.c
+++ b/arch/x86/crypto/aes_glue.c
@@@ -3,8 -3,8 +3,9 @@@
  *
  */
+ #include
 #include
+#include
 asmlinkage void aes_enc_blk(struct crypto_aes_ctx *ctx, u8 *out, const u8 *in);
 asmlinkage void aes_dec_blk(struct crypto_aes_ctx *ctx, u8 *out, const u8 *in);
diff --cc arch/x86/kernel/cpu/amd.c
index 13c6ec812545,b070bde05825..ef2e3462702d
--- a/arch/x86/kernel/cpu/amd.c
+++ b/arch/x86/kernel/cpu/amd.c
@@@ -1,6 -1,6 +1,7 @@@
+ #include
 #include
 #include
+#include
 #include
 #include
diff --cc block/bsg-lib.c
index 6690e6e41037,000000000000..7ad49c88f6b1
mode 100644,000000..100644
--- a/block/bsg-lib.c
+++ b/block/bsg-lib.c
@@@ -1,298 -1,0 +1,298 @@@
+/*
+ * BSG helper library
+ *
+ * Copyright (C) 2008 James Smart, Emulex Corporation
+ * Copyright (C) 2011 Red Hat, Inc. All rights reserved.
+ * Copyright (C) 2011 Mike Christie
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + * + */ +#include +#include +#include +#include +#include - #include ++#include +#include + +/** + * bsg_destroy_job - routine to teardown/delete a bsg job + * @job: bsg_job that is to be torn down + */ +static void bsg_destroy_job(struct bsg_job *job) +{ + put_device(job->dev); /* release reference for the request */ + + kfree(job->request_payload.sg_list); + kfree(job->reply_payload.sg_list); + kfree(job); +} + +/** + * bsg_job_done - completion routine for bsg requests + * @job: bsg_job that is complete + * @result: job reply result + * @reply_payload_rcv_len: length of payload recvd + * + * The LLD should call this when the bsg job has completed. + */ +void bsg_job_done(struct bsg_job *job, int result, + unsigned int reply_payload_rcv_len) +{ + struct request *req = job->req; + struct request *rsp = req->next_rq; + int err; + + err = job->req->errors = result; + if (err < 0) + /* we're only returning the result field in the reply */ + job->req->sense_len = sizeof(u32); + else + job->req->sense_len = job->reply_len; + /* we assume all request payload was transferred, residual == 0 */ + req->resid_len = 0; + + if (rsp) { + WARN_ON(reply_payload_rcv_len > rsp->resid_len); + + /* set reply (bidi) residual */ + rsp->resid_len -= min(reply_payload_rcv_len, rsp->resid_len); + } + blk_complete_request(req); +} +EXPORT_SYMBOL_GPL(bsg_job_done); + +/** + * bsg_softirq_done - softirq done routine for destroying the bsg requests + * @rq: BSG request that holds the job to be destroyed + */ +static void bsg_softirq_done(struct request *rq) +{ + struct bsg_job *job = rq->special; + + blk_end_request_all(rq, rq->errors); + bsg_destroy_job(job); +} + +static int bsg_map_buffer(struct bsg_buffer *buf, struct request *req) +{ + size_t sz = (sizeof(struct scatterlist) * req->nr_phys_segments); + + BUG_ON(!req->nr_phys_segments); + + buf->sg_list = kzalloc(sz, GFP_KERNEL); + if (!buf->sg_list) + return -ENOMEM; + sg_init_table(buf->sg_list, req->nr_phys_segments); + buf->sg_cnt = blk_rq_map_sg(req->q, req, buf->sg_list); + buf->payload_len = blk_rq_bytes(req); + return 0; +} + +/** + * bsg_create_job - create the bsg_job structure for the bsg request + * @dev: device that is being sent the bsg request + * @req: BSG request that needs a job structure + */ +static int bsg_create_job(struct device *dev, struct request *req) +{ + struct request *rsp = req->next_rq; + struct request_queue *q = req->q; + struct bsg_job *job; + int ret; + + BUG_ON(req->special); + + job = kzalloc(sizeof(struct bsg_job) + q->bsg_job_size, GFP_KERNEL); + if (!job) + return -ENOMEM; + + req->special = job; + job->req = req; + if (q->bsg_job_size) + job->dd_data = (void *)&job[1]; + job->request = req->cmd; + job->request_len = req->cmd_len; + job->reply = req->sense; + job->reply_len = SCSI_SENSE_BUFFERSIZE; /* Size of sense buffer + * allocated */ + if (req->bio) { + ret = bsg_map_buffer(&job->request_payload, req); + if (ret) + goto failjob_rls_job; + } + if (rsp && rsp->bio) { + ret = bsg_map_buffer(&job->reply_payload, rsp); + if (ret) + goto failjob_rls_rqst_payload; + } + job->dev = dev; + /* take a reference for the request */ + get_device(job->dev); + return 0; + +failjob_rls_rqst_payload: + kfree(job->request_payload.sg_list); +failjob_rls_job: + kfree(job); + return -ENOMEM; +} + +/* + * bsg_goose_queue - 
restart queue in case it was stopped
+ * @q: request queue to be restarted
+ */
+void bsg_goose_queue(struct request_queue *q)
+{
+	if (!q)
+		return;
+
+	blk_run_queue_async(q);
+}
+EXPORT_SYMBOL_GPL(bsg_goose_queue);
+
+/**
+ * bsg_request_fn - generic handler for bsg requests
+ * @q: request queue to manage
+ *
+ * On error, the create_bsg_job function should return a -Exyz error value
+ * that will be set in req->errors.
+ *
+ * Drivers/subsys should pass this to the queue init function.
+ */
+void bsg_request_fn(struct request_queue *q)
+{
+	struct device *dev = q->queuedata;
+	struct request *req;
+	struct bsg_job *job;
+	int ret;
+
+	if (!get_device(dev))
+		return;
+
+	while (1) {
+		req = blk_fetch_request(q);
+		if (!req)
+			break;
+		spin_unlock_irq(q->queue_lock);
+
+		ret = bsg_create_job(dev, req);
+		if (ret) {
+			req->errors = ret;
+			blk_end_request_all(req, ret);
+			spin_lock_irq(q->queue_lock);
+			continue;
+		}
+
+		job = req->special;
+		ret = q->bsg_job_fn(job);
+		spin_lock_irq(q->queue_lock);
+		if (ret)
+			break;
+	}
+
+	spin_unlock_irq(q->queue_lock);
+	put_device(dev);
+	spin_lock_irq(q->queue_lock);
+}
+EXPORT_SYMBOL_GPL(bsg_request_fn);
+
+/**
+ * bsg_setup_queue - Create and add the bsg hooks so we can receive requests
+ * @dev: device to attach bsg device to
+ * @q: request queue setup by caller
+ * @name: device to give bsg device
+ * @job_fn: bsg job handler
+ * @dd_job_size: size of LLD data needed for each job
+ *
+ * The caller should have set up the request queue with bsg_request_fn
+ * as the request_fn.
+ */
+int bsg_setup_queue(struct device *dev, struct request_queue *q,
+		    char *name, bsg_job_fn *job_fn, int dd_job_size)
+{
+	int ret;
+
+	q->queuedata = dev;
+	q->bsg_job_size = dd_job_size;
+	q->bsg_job_fn = job_fn;
+	queue_flag_set_unlocked(QUEUE_FLAG_BIDI, q);
+	blk_queue_softirq_done(q, bsg_softirq_done);
+	blk_queue_rq_timeout(q, BLK_DEFAULT_SG_TIMEOUT);
+
+	ret = bsg_register_queue(q, dev, name, NULL);
+	if (ret) {
+		printk(KERN_ERR "%s: bsg interface failed to "
+		       "initialize - register queue\n", dev->kobj.name);
+		return ret;
+	}
+
+	return 0;
+}
+EXPORT_SYMBOL_GPL(bsg_setup_queue);
+
+/**
+ * bsg_remove_queue - Deletes the bsg dev from the q
+ * @q: the request_queue that is to be torn down.
+ *
+ * Notes:
+ *   Before unregistering the queue, empty any requests that are blocked.
+ */
+void bsg_remove_queue(struct request_queue *q)
+{
+	struct request *req; /* block request */
+	int counts; /* totals for request_list count and starved */
+
+	if (!q)
+		return;
+
+	/* Stop taking in new requests */
+	spin_lock_irq(q->queue_lock);
+	blk_stop_queue(q);
+
+	/* drain all requests in the queue */
+	while (1) {
+		/* need the lock to fetch a request
+		 * this may fetch the same request as the previous pass
+		 */
+		req = blk_fetch_request(q);
+		/* save requests in use and starved */
+		counts = q->rq.count[0] + q->rq.count[1] +
+			 q->rq.starved[0] + q->rq.starved[1];
+		spin_unlock_irq(q->queue_lock);
+		/* any requests still outstanding? */
+		if (counts == 0)
+			break;
+
+		/* This may be the same req as the previous iteration,
+		 * always send the blk_end_request_all after a prefetch.
+		 * It is not okay to not end the request because the
+		 * prefetch started the request.
+ */ + if (req) { + /* return -ENXIO to indicate that this queue is + * going away + */ + req->errors = -ENXIO; + blk_end_request_all(req, -ENXIO); + } + + msleep(200); /* allow bsg to possibly finish */ + spin_lock_irq(q->queue_lock); + } + bsg_unregister_queue(q); +} +EXPORT_SYMBOL_GPL(bsg_remove_queue); diff --cc drivers/base/power/common.c index 29820c396182,000000000000..4af7c1cbf909 mode 100644,000000..100644 --- a/drivers/base/power/common.c +++ b/drivers/base/power/common.c @@@ -1,86 -1,0 +1,86 @@@ +/* + * drivers/base/power/common.c - Common device power management code. + * + * Copyright (C) 2011 Rafael J. Wysocki , Renesas Electronics Corp. + * + * This file is released under the GPLv2. + */ + +#include +#include - #include ++#include +#include +#include + +/** + * dev_pm_get_subsys_data - Create or refcount power.subsys_data for device. + * @dev: Device to handle. + * + * If power.subsys_data is NULL, point it to a new object, otherwise increment + * its reference counter. Return 1 if a new object has been created, otherwise + * return 0 or error code. + */ +int dev_pm_get_subsys_data(struct device *dev) +{ + struct pm_subsys_data *psd; + int ret = 0; + + psd = kzalloc(sizeof(*psd), GFP_KERNEL); + if (!psd) + return -ENOMEM; + + spin_lock_irq(&dev->power.lock); + + if (dev->power.subsys_data) { + dev->power.subsys_data->refcount++; + } else { + spin_lock_init(&psd->lock); + psd->refcount = 1; + dev->power.subsys_data = psd; + pm_clk_init(dev); + psd = NULL; + ret = 1; + } + + spin_unlock_irq(&dev->power.lock); + + /* kfree() verifies that its argument is nonzero. */ + kfree(psd); + + return ret; +} +EXPORT_SYMBOL_GPL(dev_pm_get_subsys_data); + +/** + * dev_pm_put_subsys_data - Drop reference to power.subsys_data. + * @dev: Device to handle. + * + * If the reference counter of power.subsys_data is zero after dropping the + * reference, power.subsys_data is removed. Return 1 if that happens or 0 + * otherwise. 
+ */ +int dev_pm_put_subsys_data(struct device *dev) +{ + struct pm_subsys_data *psd; + int ret = 0; + + spin_lock_irq(&dev->power.lock); + + psd = dev_to_psd(dev); + if (!psd) { + ret = -EINVAL; + goto out; + } + + if (--psd->refcount == 0) { + dev->power.subsys_data = NULL; + kfree(psd); + ret = 1; + } + + out: + spin_unlock_irq(&dev->power.lock); + + return ret; +} +EXPORT_SYMBOL_GPL(dev_pm_put_subsys_data); diff --cc drivers/bcma/driver_chipcommon_pmu.c index 2968d809d49f,fcc63db0ce75..800163c8c2e7 --- a/drivers/bcma/driver_chipcommon_pmu.c +++ b/drivers/bcma/driver_chipcommon_pmu.c @@@ -9,49 -9,22 +9,50 @@@ */ #include "bcma_private.h" ++#include #include -static void bcma_chipco_chipctl_maskset(struct bcma_drv_cc *cc, - u32 offset, u32 mask, u32 set) +static u32 bcma_chipco_pll_read(struct bcma_drv_cc *cc, u32 offset) { - u32 value; + bcma_cc_write32(cc, BCMA_CC_PLLCTL_ADDR, offset); + bcma_cc_read32(cc, BCMA_CC_PLLCTL_ADDR); + return bcma_cc_read32(cc, BCMA_CC_PLLCTL_DATA); +} - bcma_cc_read32(cc, BCMA_CC_CHIPCTL_ADDR); +void bcma_chipco_pll_write(struct bcma_drv_cc *cc, u32 offset, u32 value) +{ + bcma_cc_write32(cc, BCMA_CC_PLLCTL_ADDR, offset); + bcma_cc_read32(cc, BCMA_CC_PLLCTL_ADDR); + bcma_cc_write32(cc, BCMA_CC_PLLCTL_DATA, value); +} +EXPORT_SYMBOL_GPL(bcma_chipco_pll_write); + +void bcma_chipco_pll_maskset(struct bcma_drv_cc *cc, u32 offset, u32 mask, + u32 set) +{ + bcma_cc_write32(cc, BCMA_CC_PLLCTL_ADDR, offset); + bcma_cc_read32(cc, BCMA_CC_PLLCTL_ADDR); + bcma_cc_maskset32(cc, BCMA_CC_PLLCTL_DATA, mask, set); +} +EXPORT_SYMBOL_GPL(bcma_chipco_pll_maskset); + +void bcma_chipco_chipctl_maskset(struct bcma_drv_cc *cc, + u32 offset, u32 mask, u32 set) +{ bcma_cc_write32(cc, BCMA_CC_CHIPCTL_ADDR, offset); bcma_cc_read32(cc, BCMA_CC_CHIPCTL_ADDR); - value = bcma_cc_read32(cc, BCMA_CC_CHIPCTL_DATA); - value &= mask; - value |= set; - bcma_cc_write32(cc, BCMA_CC_CHIPCTL_DATA, value); - bcma_cc_read32(cc, BCMA_CC_CHIPCTL_DATA); + bcma_cc_maskset32(cc, BCMA_CC_CHIPCTL_DATA, mask, set); +} +EXPORT_SYMBOL_GPL(bcma_chipco_chipctl_maskset); + +void bcma_chipco_regctl_maskset(struct bcma_drv_cc *cc, u32 offset, u32 mask, + u32 set) +{ + bcma_cc_write32(cc, BCMA_CC_REGCTL_ADDR, offset); + bcma_cc_read32(cc, BCMA_CC_REGCTL_ADDR); + bcma_cc_maskset32(cc, BCMA_CC_REGCTL_DATA, mask, set); } +EXPORT_SYMBOL_GPL(bcma_chipco_regctl_maskset); static void bcma_pmu_pll_init(struct bcma_drv_cc *cc) { diff --cc drivers/gpio/gpio-mxc.c index b588f8a41e60,73a177b92e84..0f189b34bda3 --- a/drivers/gpio/gpio-mxc.c +++ b/drivers/gpio/gpio-mxc.c @@@ -29,10 -29,9 +29,11 @@@ #include #include #include + #include #include +#define irq_to_gpio(irq) ((irq) - MXC_GPIO_IRQ_START) + enum mxc_gpio_hwtype { IMX1_GPIO, /* runs on i.mx1 */ IMX21_GPIO, /* runs on i.mx21 and i.mx27 */ diff --cc drivers/md/persistent-data/dm-btree-remove.c index cdd71d67def9,000000000000..e7071f66dc39 mode 100644,000000..100644 --- a/drivers/md/persistent-data/dm-btree-remove.c +++ b/drivers/md/persistent-data/dm-btree-remove.c @@@ -1,571 -1,0 +1,571 @@@ +/* + * Copyright (C) 2011 Red Hat, Inc. All rights reserved. + * + * This file is released under the GPL. + */ + +#include "dm-btree.h" +#include "dm-btree-internal.h" +#include "dm-transaction-manager.h" + - #include ++#include + +/* + * Removing an entry from a btree + * ============================== + * + * A very important constraint for our btree is that no node, except the + * root, may have fewer than a certain number of entries. 
(MIN_ENTRIES <= nr_entries <= MAX_ENTRIES).
+ *
+ * Ensuring this is complicated by the way we want to only ever hold the
+ * locks on 2 nodes concurrently, and only change nodes in a top to bottom
+ * fashion.
+ *
+ * Each node may have a left or right sibling. When descending the spine,
+ * if a node contains only MIN_ENTRIES then we try to increase this to at
+ * least MIN_ENTRIES + 1. We do this in the following ways:
+ *
+ * [A] No siblings => this can only happen if the node is the root, in which
+ *     case we copy the child's contents over the root.
+ *
+ * [B] No left sibling
+ *     ==> rebalance(node, right sibling)
+ *
+ * [C] No right sibling
+ *     ==> rebalance(left sibling, node)
+ *
+ * [D] Both siblings, total_entries(left, node, right) <= DEL_THRESHOLD
+ *     ==> delete node, adding its contents to left and right
+ *
+ * [E] Both siblings, total_entries(left, node, right) > DEL_THRESHOLD
+ *     ==> rebalance(left, node, right)
+ *
+ * After these operations it's possible that our original node no
+ * longer contains the desired subtree. For this reason this rebalancing
+ * is performed on the children of the current node. This also avoids
+ * having a special case for the root.
+ *
+ * Once this rebalancing has occurred we can then step into the child node
+ * for internal nodes, or delete the entry for leaf nodes.
+ */
+
+/*
+ * Some little utilities for moving node data around.
+ */
+static void node_shift(struct node *n, int shift)
+{
+	uint32_t nr_entries = le32_to_cpu(n->header.nr_entries);
+
+	if (shift < 0) {
+		shift = -shift;
+		memmove(key_ptr(n, 0),
+			key_ptr(n, shift),
+			(nr_entries - shift) * sizeof(__le64));
+		memmove(value_ptr(n, 0, sizeof(__le64)),
+			value_ptr(n, shift, sizeof(__le64)),
+			(nr_entries - shift) * sizeof(__le64));
+	} else {
+		memmove(key_ptr(n, shift),
+			key_ptr(n, 0),
+			nr_entries * sizeof(__le64));
+		memmove(value_ptr(n, shift, sizeof(__le64)),
+			value_ptr(n, 0, sizeof(__le64)),
+			nr_entries * sizeof(__le64));
+	}
+}
+
+static void node_copy(struct node *left, struct node *right, int shift)
+{
+	uint32_t nr_left = le32_to_cpu(left->header.nr_entries);
+
+	if (shift < 0) {
+		shift = -shift;
+		memcpy(key_ptr(left, nr_left),
+		       key_ptr(right, 0),
+		       shift * sizeof(__le64));
+		memcpy(value_ptr(left, nr_left, sizeof(__le64)),
+		       value_ptr(right, 0, sizeof(__le64)),
+		       shift * sizeof(__le64));
+	} else {
+		memcpy(key_ptr(right, 0),
+		       key_ptr(left, nr_left - shift),
+		       shift * sizeof(__le64));
+		memcpy(value_ptr(right, 0, sizeof(__le64)),
+		       value_ptr(left, nr_left - shift, sizeof(__le64)),
+		       shift * sizeof(__le64));
+	}
+}
+
+/*
+ * Delete a specific entry from a leaf node.
+ */
+static void delete_at(struct node *n, unsigned index, size_t value_size)
+{
+	unsigned nr_entries = le32_to_cpu(n->header.nr_entries);
+	unsigned nr_to_copy = nr_entries - (index + 1);
+
+	if (nr_to_copy) {
+		memmove(key_ptr(n, index),
+			key_ptr(n, index + 1),
+			nr_to_copy * sizeof(__le64));
+
+		memmove(value_ptr(n, index, value_size),
+			value_ptr(n, index + 1, value_size),
+			nr_to_copy * value_size);
+	}
+
+	n->header.nr_entries = cpu_to_le32(nr_entries - 1);
+}
+
+static unsigned del_threshold(struct node *n)
+{
+	return le32_to_cpu(n->header.max_entries) / 3;
+}
+
+static unsigned merge_threshold(struct node *n)
+{
+	/*
+	 * The extra one is because we know we're potentially going to
+	 * delete an entry.
+ */ + return 2 * (le32_to_cpu(n->header.max_entries) / 3) + 1; +} + +struct child { + unsigned index; + struct dm_block *block; + struct node *n; +}; + +static struct dm_btree_value_type le64_type = { + .context = NULL, + .size = sizeof(__le64), + .inc = NULL, + .dec = NULL, + .equal = NULL +}; + +static int init_child(struct dm_btree_info *info, struct node *parent, + unsigned index, struct child *result) +{ + int r, inc; + dm_block_t root; + + result->index = index; + root = value64(parent, index); + + r = dm_tm_shadow_block(info->tm, root, &btree_node_validator, + &result->block, &inc); + if (r) + return r; + + result->n = dm_block_data(result->block); + + if (inc) + inc_children(info->tm, result->n, &le64_type); + + return 0; +} + +static int exit_child(struct dm_btree_info *info, struct child *c) +{ + return dm_tm_unlock(info->tm, c->block); +} + +static void shift(struct node *left, struct node *right, int count) +{ + if (!count) + return; + + if (count > 0) { + node_shift(right, count); + node_copy(left, right, count); + } else { + node_copy(left, right, count); + node_shift(right, count); + } + + left->header.nr_entries = + cpu_to_le32(le32_to_cpu(left->header.nr_entries) - count); + + right->header.nr_entries = + cpu_to_le32(le32_to_cpu(right->header.nr_entries) + count); +} + +static void __rebalance2(struct dm_btree_info *info, struct node *parent, + struct child *l, struct child *r) +{ + struct node *left = l->n; + struct node *right = r->n; + uint32_t nr_left = le32_to_cpu(left->header.nr_entries); + uint32_t nr_right = le32_to_cpu(right->header.nr_entries); + + if (nr_left + nr_right <= merge_threshold(left)) { + /* + * Merge + */ + node_copy(left, right, -nr_right); + left->header.nr_entries = cpu_to_le32(nr_left + nr_right); + + *((__le64 *) value_ptr(parent, l->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(l->block)); + delete_at(parent, r->index, sizeof(__le64)); + + /* + * We need to decrement the right block, but not it's + * children, since they're still referenced by left. + */ + dm_tm_dec(info->tm, dm_block_location(r->block)); + } else { + /* + * Rebalance. 
+ */ + unsigned target_left = (nr_left + nr_right) / 2; + + shift(left, right, nr_left - target_left); + *((__le64 *) value_ptr(parent, l->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(l->block)); + *((__le64 *) value_ptr(parent, r->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(r->block)); + *key_ptr(parent, r->index) = right->keys[0]; + } +} + +static int rebalance2(struct shadow_spine *s, struct dm_btree_info *info, + unsigned left_index) +{ + int r; + struct node *parent; + struct child left, right; + + parent = dm_block_data(shadow_current(s)); + + r = init_child(info, parent, left_index, &left); + if (r) + return r; + + r = init_child(info, parent, left_index + 1, &right); + if (r) { + exit_child(info, &left); + return r; + } + + __rebalance2(info, parent, &left, &right); + + r = exit_child(info, &left); + if (r) { + exit_child(info, &right); + return r; + } + + r = exit_child(info, &right); + if (r) + return r; + + return 0; +} + +static void __rebalance3(struct dm_btree_info *info, struct node *parent, + struct child *l, struct child *c, struct child *r) +{ + struct node *left = l->n; + struct node *center = c->n; + struct node *right = r->n; + + uint32_t nr_left = le32_to_cpu(left->header.nr_entries); + uint32_t nr_center = le32_to_cpu(center->header.nr_entries); + uint32_t nr_right = le32_to_cpu(right->header.nr_entries); + uint32_t max_entries = le32_to_cpu(left->header.max_entries); + + unsigned target; + + if (((nr_left + nr_center + nr_right) / 2) < merge_threshold(center)) { + /* + * Delete center node: + * + * We dump as many entries from center as possible into + * left, then the rest in right, then rebalance2. This + * wastes some cpu, but I want something simple atm. + */ + unsigned shift = min(max_entries - nr_left, nr_center); + + node_copy(left, center, -shift); + left->header.nr_entries = cpu_to_le32(nr_left + shift); + + if (shift != nr_center) { + shift = nr_center - shift; + node_shift(right, shift); + node_copy(center, right, shift); + right->header.nr_entries = cpu_to_le32(nr_right + shift); + } + + *((__le64 *) value_ptr(parent, l->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(l->block)); + *((__le64 *) value_ptr(parent, r->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(r->block)); + *key_ptr(parent, r->index) = right->keys[0]; + + delete_at(parent, c->index, sizeof(__le64)); + r->index--; + + dm_tm_dec(info->tm, dm_block_location(c->block)); + __rebalance2(info, parent, l, r); + + return; + } + + /* + * Rebalance + */ + target = (nr_left + nr_center + nr_right) / 3; + BUG_ON(target == nr_center); + + /* + * Adjust the left node + */ + shift(left, center, nr_left - target); + + /* + * Adjust the right node + */ + shift(center, right, target - nr_right); + + *((__le64 *) value_ptr(parent, l->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(l->block)); + *((__le64 *) value_ptr(parent, c->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(c->block)); + *((__le64 *) value_ptr(parent, r->index, sizeof(__le64))) = + cpu_to_le64(dm_block_location(r->block)); + + *key_ptr(parent, c->index) = center->keys[0]; + *key_ptr(parent, r->index) = right->keys[0]; +} + +static int rebalance3(struct shadow_spine *s, struct dm_btree_info *info, + unsigned left_index) +{ + int r; + struct node *parent = dm_block_data(shadow_current(s)); + struct child left, center, right; + + /* + * FIXME: fill out an array? 
+ */ + r = init_child(info, parent, left_index, &left); + if (r) + return r; + + r = init_child(info, parent, left_index + 1, ¢er); + if (r) { + exit_child(info, &left); + return r; + } + + r = init_child(info, parent, left_index + 2, &right); + if (r) { + exit_child(info, &left); + exit_child(info, ¢er); + return r; + } + + __rebalance3(info, parent, &left, ¢er, &right); + + r = exit_child(info, &left); + if (r) { + exit_child(info, ¢er); + exit_child(info, &right); + return r; + } + + r = exit_child(info, ¢er); + if (r) { + exit_child(info, &right); + return r; + } + + r = exit_child(info, &right); + if (r) + return r; + + return 0; +} + +static int get_nr_entries(struct dm_transaction_manager *tm, + dm_block_t b, uint32_t *result) +{ + int r; + struct dm_block *block; + struct node *n; + + r = dm_tm_read_lock(tm, b, &btree_node_validator, &block); + if (r) + return r; + + n = dm_block_data(block); + *result = le32_to_cpu(n->header.nr_entries); + + return dm_tm_unlock(tm, block); +} + +static int rebalance_children(struct shadow_spine *s, + struct dm_btree_info *info, uint64_t key) +{ + int i, r, has_left_sibling, has_right_sibling; + uint32_t child_entries; + struct node *n; + + n = dm_block_data(shadow_current(s)); + + if (le32_to_cpu(n->header.nr_entries) == 1) { + struct dm_block *child; + dm_block_t b = value64(n, 0); + + r = dm_tm_read_lock(info->tm, b, &btree_node_validator, &child); + if (r) + return r; + + memcpy(n, dm_block_data(child), + dm_bm_block_size(dm_tm_get_bm(info->tm))); + r = dm_tm_unlock(info->tm, child); + dm_tm_dec(info->tm, dm_block_location(child)); + + return r; + } + + i = lower_bound(n, key); + if (i < 0) + return -ENODATA; + + r = get_nr_entries(info->tm, value64(n, i), &child_entries); + if (r) + return r; + + if (child_entries > del_threshold(n)) + return 0; + + has_left_sibling = i > 0 ? 1 : 0; + has_right_sibling = + (i >= (le32_to_cpu(n->header.nr_entries) - 1)) ? 0 : 1; + + if (!has_left_sibling) + r = rebalance2(s, info, i); + + else if (!has_right_sibling) + r = rebalance2(s, info, i - 1); + + else + r = rebalance3(s, info, i - 1); + + return r; +} + +static int do_leaf(struct node *n, uint64_t key, unsigned *index) +{ + int i = lower_bound(n, key); + + if ((i < 0) || + (i >= le32_to_cpu(n->header.nr_entries)) || + (le64_to_cpu(n->keys[i]) != key)) + return -ENODATA; + + *index = i; + + return 0; +} + +/* + * Prepares for removal from one level of the hierarchy. The caller must + * actually call delete_at() to remove the entry at index. + */ +static int remove_raw(struct shadow_spine *s, struct dm_btree_info *info, + struct dm_btree_value_type *vt, dm_block_t root, + uint64_t key, unsigned *index) +{ + int i = *index, inc, r; + struct node *n; + + for (;;) { + r = shadow_step(s, root, vt, &inc); + if (r < 0) + break; + + /* + * We have to patch up the parent node, ugly, but I don't + * see a way to do this automatically as part of the spine + * op. 
+ */ + if (shadow_has_parent(s)) { + __le64 location = cpu_to_le64(dm_block_location(shadow_current(s))); + memcpy(value_ptr(dm_block_data(shadow_parent(s)), i, sizeof(uint64_t)), + &location, sizeof(__le64)); + } + + n = dm_block_data(shadow_current(s)); + if (inc) + inc_children(info->tm, n, vt); + + if (le32_to_cpu(n->header.flags) & LEAF_NODE) + return do_leaf(n, key, index); + + r = rebalance_children(s, info, key); + if (r) + break; + + n = dm_block_data(shadow_current(s)); + if (le32_to_cpu(n->header.flags) & LEAF_NODE) + return do_leaf(n, key, index); + + i = lower_bound(n, key); + + /* + * We know the key is present, or else + * rebalance_children would have returned + * -ENODATA + */ + root = value64(n, i); + } + + return r; +} + +int dm_btree_remove(struct dm_btree_info *info, dm_block_t root, + uint64_t *keys, dm_block_t *new_root) +{ + unsigned level, last_level = info->levels - 1; + int index = 0, r = 0; + struct shadow_spine spine; + struct node *n; + + init_shadow_spine(&spine, info); + for (level = 0; level < info->levels; level++) { + r = remove_raw(&spine, info, + (level == last_level ? + &info->value_type : &le64_type), + root, keys[level], (unsigned *)&index); + if (r < 0) + break; + + n = dm_block_data(shadow_current(&spine)); + if (level != last_level) { + root = value64(n, index); + continue; + } + + BUG_ON(index < 0 || index >= le32_to_cpu(n->header.nr_entries)); + + if (info->value_type.dec) + info->value_type.dec(info->value_type.context, + value_ptr(n, index, info->value_type.size)); + + delete_at(n, index, info->value_type.size); + + r = 0; + *new_root = shadow_root(&spine); + } + + exit_shadow_spine(&spine); + + return r; +} +EXPORT_SYMBOL_GPL(dm_btree_remove); diff --cc drivers/md/persistent-data/dm-btree.c index ca16d5b4799a,000000000000..408b762532a7 mode 100644,000000..100644 --- a/drivers/md/persistent-data/dm-btree.c +++ b/drivers/md/persistent-data/dm-btree.c @@@ -1,861 -1,0 +1,861 @@@ +/* + * Copyright (C) 2011 Red Hat, Inc. All rights reserved. + * + * This file is released under the GPL. + */ + +#include "dm-btree-internal.h" +#include "dm-space-map.h" +#include "dm-transaction-manager.h" + - #include ++#include +#include + +#define DM_MSG_PREFIX "btree" + +/*---------------------------------------------------------------- + * Array manipulation + *--------------------------------------------------------------*/ +static void memcpy_disk(void *dest, const void *src, size_t len) + __dm_written_to_disk(src) +{ + memcpy(dest, src, len); + __dm_unbless_for_disk(src); +} + +static void array_insert(void *base, size_t elt_size, unsigned nr_elts, + unsigned index, void *elt) + __dm_written_to_disk(elt) +{ + if (index < nr_elts) + memmove(base + (elt_size * (index + 1)), + base + (elt_size * index), + (nr_elts - index) * elt_size); + + memcpy_disk(base + (elt_size * index), elt, elt_size); +} + +/*----------------------------------------------------------------*/ + +/* makes the assumption that no two keys are the same. */ +static int bsearch(struct node *n, uint64_t key, int want_hi) +{ + int lo = -1, hi = le32_to_cpu(n->header.nr_entries); + + while (hi - lo > 1) { + int mid = lo + ((hi - lo) / 2); + uint64_t mid_key = le64_to_cpu(n->keys[mid]); + + if (mid_key == key) + return mid; + + if (mid_key < key) + lo = mid; + else + hi = mid; + } + + return want_hi ? 
hi : lo; +} + +int lower_bound(struct node *n, uint64_t key) +{ + return bsearch(n, key, 0); +} + +void inc_children(struct dm_transaction_manager *tm, struct node *n, + struct dm_btree_value_type *vt) +{ + unsigned i; + uint32_t nr_entries = le32_to_cpu(n->header.nr_entries); + + if (le32_to_cpu(n->header.flags) & INTERNAL_NODE) + for (i = 0; i < nr_entries; i++) + dm_tm_inc(tm, value64(n, i)); + else if (vt->inc) + for (i = 0; i < nr_entries; i++) + vt->inc(vt->context, + value_ptr(n, i, vt->size)); +} + +static int insert_at(size_t value_size, struct node *node, unsigned index, + uint64_t key, void *value) + __dm_written_to_disk(value) +{ + uint32_t nr_entries = le32_to_cpu(node->header.nr_entries); + __le64 key_le = cpu_to_le64(key); + + if (index > nr_entries || + index >= le32_to_cpu(node->header.max_entries)) { + DMERR("too many entries in btree node for insert"); + __dm_unbless_for_disk(value); + return -ENOMEM; + } + + __dm_bless_for_disk(&key_le); + + array_insert(node->keys, sizeof(*node->keys), nr_entries, index, &key_le); + array_insert(value_base(node), value_size, nr_entries, index, value); + node->header.nr_entries = cpu_to_le32(nr_entries + 1); + + return 0; +} + +/*----------------------------------------------------------------*/ + +/* + * We want 3n entries (for some n). This works more nicely for repeated + * insert remove loops than (2n + 1). + */ +static uint32_t calc_max_entries(size_t value_size, size_t block_size) +{ + uint32_t total, n; + size_t elt_size = sizeof(uint64_t) + value_size; /* key + value */ + + block_size -= sizeof(struct node_header); + total = block_size / elt_size; + n = total / 3; /* rounds down */ + + return 3 * n; +} + +int dm_btree_create(struct dm_btree_info *info, dm_block_t *root) +{ + int r; + struct dm_block *b; + struct node *n; + size_t block_size; + uint32_t max_entries; + + r = new_block(info, &b); + if (r < 0) + return r; + + block_size = dm_bm_block_size(dm_tm_get_bm(info->tm)); + max_entries = calc_max_entries(info->value_type.size, block_size); + + n = dm_block_data(b); + memset(n, 0, block_size); + n->header.flags = cpu_to_le32(LEAF_NODE); + n->header.nr_entries = cpu_to_le32(0); + n->header.max_entries = cpu_to_le32(max_entries); + n->header.value_size = cpu_to_le32(info->value_type.size); + + *root = dm_block_location(b); + + return unlock_block(info, b); +} +EXPORT_SYMBOL_GPL(dm_btree_create); + +/*----------------------------------------------------------------*/ + +/* + * Deletion uses a recursive algorithm, since we have limited stack space + * we explicitly manage our own stack on the heap. 
+ */ +#define MAX_SPINE_DEPTH 64 +struct frame { + struct dm_block *b; + struct node *n; + unsigned level; + unsigned nr_children; + unsigned current_child; +}; + +struct del_stack { + struct dm_transaction_manager *tm; + int top; + struct frame spine[MAX_SPINE_DEPTH]; +}; + +static int top_frame(struct del_stack *s, struct frame **f) +{ + if (s->top < 0) { + DMERR("btree deletion stack empty"); + return -EINVAL; + } + + *f = s->spine + s->top; + + return 0; +} + +static int unprocessed_frames(struct del_stack *s) +{ + return s->top >= 0; +} + +static int push_frame(struct del_stack *s, dm_block_t b, unsigned level) +{ + int r; + uint32_t ref_count; + + if (s->top >= MAX_SPINE_DEPTH - 1) { + DMERR("btree deletion stack out of memory"); + return -ENOMEM; + } + + r = dm_tm_ref(s->tm, b, &ref_count); + if (r) + return r; + + if (ref_count > 1) + /* + * This is a shared node, so we can just decrement its + * reference counter and leave the children. + */ + dm_tm_dec(s->tm, b); + + else { + struct frame *f = s->spine + ++s->top; + + r = dm_tm_read_lock(s->tm, b, &btree_node_validator, &f->b); + if (r) { + s->top--; + return r; + } + + f->n = dm_block_data(f->b); + f->level = level; + f->nr_children = le32_to_cpu(f->n->header.nr_entries); + f->current_child = 0; + } + + return 0; +} + +static void pop_frame(struct del_stack *s) +{ + struct frame *f = s->spine + s->top--; + + dm_tm_dec(s->tm, dm_block_location(f->b)); + dm_tm_unlock(s->tm, f->b); +} + +int dm_btree_destroy(struct dm_btree_info *info, dm_block_t root) +{ + int r; + struct del_stack *s; + + s = kmalloc(sizeof(*s), GFP_KERNEL); + if (!s) + return -ENOMEM; + + s->tm = info->tm; + s->top = -1; + + r = push_frame(s, root, 1); + if (r) + goto out; + + while (unprocessed_frames(s)) { + uint32_t flags; + struct frame *f; + dm_block_t b; + + r = top_frame(s, &f); + if (r) + goto out; + + if (f->current_child >= f->nr_children) { + pop_frame(s); + continue; + } + + flags = le32_to_cpu(f->n->header.flags); + if (flags & INTERNAL_NODE) { + b = value64(f->n, f->current_child); + f->current_child++; + r = push_frame(s, b, f->level); + if (r) + goto out; + + } else if (f->level != (info->levels - 1)) { + b = value64(f->n, f->current_child); + f->current_child++; + r = push_frame(s, b, f->level + 1); + if (r) + goto out; + + } else { + if (info->value_type.dec) { + unsigned i; + + for (i = 0; i < f->nr_children; i++) + info->value_type.dec(info->value_type.context, + value_ptr(f->n, i, info->value_type.size)); + } + f->current_child = f->nr_children; + } + } + +out: + kfree(s); + return r; +} +EXPORT_SYMBOL_GPL(dm_btree_destroy); + +// FIXME Implement or remove this fn before final submission. 
+int dm_btree_delete_gt(struct dm_btree_info *info, dm_block_t root, uint64_t *key, + dm_block_t *new_root) +{ + /* FIXME: implement */ + return 0; +} +EXPORT_SYMBOL_GPL(dm_btree_delete_gt); + +/*----------------------------------------------------------------*/ + +static int btree_lookup_raw(struct ro_spine *s, dm_block_t block, uint64_t key, + int (*search_fn)(struct node *, uint64_t), + uint64_t *result_key, void *v, size_t value_size) +{ + int i, r; + uint32_t flags, nr_entries; + + do { + r = ro_step(s, block); + if (r < 0) + return r; + + i = search_fn(ro_node(s), key); + + flags = le32_to_cpu(ro_node(s)->header.flags); + nr_entries = le32_to_cpu(ro_node(s)->header.nr_entries); + if (i < 0 || i >= nr_entries) + return -ENODATA; + + if (flags & INTERNAL_NODE) + block = value64(ro_node(s), i); + + } while (!(flags & LEAF_NODE)); + + *result_key = le64_to_cpu(ro_node(s)->keys[i]); + memcpy(v, value_ptr(ro_node(s), i, value_size), value_size); + + return 0; +} + +int dm_btree_lookup(struct dm_btree_info *info, dm_block_t root, + uint64_t *keys, void *value_le) +{ + unsigned level, last_level = info->levels - 1; + int r = -ENODATA; + uint64_t rkey; + __le64 internal_value_le; + struct ro_spine spine; + + init_ro_spine(&spine, info); + for (level = 0; level < info->levels; level++) { + size_t size; + void *value_p; + + if (level == last_level) { + value_p = value_le; + size = info->value_type.size; + + } else { + value_p = &internal_value_le; + size = sizeof(uint64_t); + } + + r = btree_lookup_raw(&spine, root, keys[level], + lower_bound, &rkey, + value_p, size); + + if (!r) { + if (rkey != keys[level]) { + exit_ro_spine(&spine); + return -ENODATA; + } + } else { + exit_ro_spine(&spine); + return r; + } + + root = le64_to_cpu(internal_value_le); + } + exit_ro_spine(&spine); + + return r; +} +EXPORT_SYMBOL_GPL(dm_btree_lookup); + +/* + * Splits a node by creating a sibling node and shifting half the nodes + * contents across. Assumes there is a parent node, and it has room for + * another child. + * + * Before: + * +--------+ + * | Parent | + * +--------+ + * | + * v + * +----------+ + * | A ++++++ | + * +----------+ + * + * + * After: + * +--------+ + * | Parent | + * +--------+ + * | | + * v +------+ + * +---------+ | + * | A* +++ | v + * +---------+ +-------+ + * | B +++ | + * +-------+ + * + * Where A* is a shadow of A. + */ +static int btree_split_sibling(struct shadow_spine *s, dm_block_t root, + unsigned parent_index, uint64_t key) +{ + int r; + size_t size; + unsigned nr_left, nr_right; + struct dm_block *left, *right, *parent; + struct node *ln, *rn, *pn; + __le64 location; + + left = shadow_current(s); + + r = new_block(s->info, &right); + if (r < 0) + return r; + + ln = dm_block_data(left); + rn = dm_block_data(right); + + nr_left = le32_to_cpu(ln->header.nr_entries) / 2; + nr_right = le32_to_cpu(ln->header.nr_entries) - nr_left; + + ln->header.nr_entries = cpu_to_le32(nr_left); + + rn->header.flags = ln->header.flags; + rn->header.nr_entries = cpu_to_le32(nr_right); + rn->header.max_entries = ln->header.max_entries; + rn->header.value_size = ln->header.value_size; + memcpy(rn->keys, ln->keys + nr_left, nr_right * sizeof(rn->keys[0])); + + size = le32_to_cpu(ln->header.flags) & INTERNAL_NODE ? 
+ sizeof(uint64_t) : s->info->value_type.size; + memcpy(value_ptr(rn, 0, size), value_ptr(ln, nr_left, size), + size * nr_right); + + /* + * Patch up the parent + */ + parent = shadow_parent(s); + + pn = dm_block_data(parent); + location = cpu_to_le64(dm_block_location(left)); + __dm_bless_for_disk(&location); + memcpy_disk(value_ptr(pn, parent_index, sizeof(__le64)), + &location, sizeof(__le64)); + + location = cpu_to_le64(dm_block_location(right)); + __dm_bless_for_disk(&location); + + r = insert_at(sizeof(__le64), pn, parent_index + 1, + le64_to_cpu(rn->keys[0]), &location); + if (r) + return r; + + if (key < le64_to_cpu(rn->keys[0])) { + unlock_block(s->info, right); + s->nodes[1] = left; + } else { + unlock_block(s->info, left); + s->nodes[1] = right; + } + + return 0; +} + +/* + * Splits a node by creating two new children beneath the given node. + * + * Before: + * +----------+ + * | A ++++++ | + * +----------+ + * + * + * After: + * +------------+ + * | A (shadow) | + * +------------+ + * | | + * +------+ +----+ + * | | + * v v + * +-------+ +-------+ + * | B +++ | | C +++ | + * +-------+ +-------+ + */ +static int btree_split_beneath(struct shadow_spine *s, uint64_t key) +{ + int r; + size_t size; + unsigned nr_left, nr_right; + struct dm_block *left, *right, *new_parent; + struct node *pn, *ln, *rn; + __le64 val; + + new_parent = shadow_current(s); + + r = new_block(s->info, &left); + if (r < 0) + return r; + + r = new_block(s->info, &right); + if (r < 0) { + /* FIXME: put left */ + return r; + } + + pn = dm_block_data(new_parent); + ln = dm_block_data(left); + rn = dm_block_data(right); + + nr_left = le32_to_cpu(pn->header.nr_entries) / 2; + nr_right = le32_to_cpu(pn->header.nr_entries) - nr_left; + + ln->header.flags = pn->header.flags; + ln->header.nr_entries = cpu_to_le32(nr_left); + ln->header.max_entries = pn->header.max_entries; + ln->header.value_size = pn->header.value_size; + + rn->header.flags = pn->header.flags; + rn->header.nr_entries = cpu_to_le32(nr_right); + rn->header.max_entries = pn->header.max_entries; + rn->header.value_size = pn->header.value_size; + + memcpy(ln->keys, pn->keys, nr_left * sizeof(pn->keys[0])); + memcpy(rn->keys, pn->keys + nr_left, nr_right * sizeof(pn->keys[0])); + + size = le32_to_cpu(pn->header.flags) & INTERNAL_NODE ? + sizeof(__le64) : s->info->value_type.size; + memcpy(value_ptr(ln, 0, size), value_ptr(pn, 0, size), nr_left * size); + memcpy(value_ptr(rn, 0, size), value_ptr(pn, nr_left, size), + nr_right * size); + + /* new_parent should just point to l and r now */ + pn->header.flags = cpu_to_le32(INTERNAL_NODE); + pn->header.nr_entries = cpu_to_le32(2); + pn->header.max_entries = cpu_to_le32( + calc_max_entries(sizeof(__le64), + dm_bm_block_size( + dm_tm_get_bm(s->info->tm)))); + pn->header.value_size = cpu_to_le32(sizeof(__le64)); + + val = cpu_to_le64(dm_block_location(left)); + __dm_bless_for_disk(&val); + pn->keys[0] = ln->keys[0]; + memcpy_disk(value_ptr(pn, 0, sizeof(__le64)), &val, sizeof(__le64)); + + val = cpu_to_le64(dm_block_location(right)); + __dm_bless_for_disk(&val); + pn->keys[1] = rn->keys[0]; + memcpy_disk(value_ptr(pn, 1, sizeof(__le64)), &val, sizeof(__le64)); + + /* + * rejig the spine. 
This is ugly, since it knows too + * much about the spine + */ + if (s->nodes[0] != new_parent) { + unlock_block(s->info, s->nodes[0]); + s->nodes[0] = new_parent; + } + if (key < le64_to_cpu(rn->keys[0])) { + unlock_block(s->info, right); + s->nodes[1] = left; + } else { + unlock_block(s->info, left); + s->nodes[1] = right; + } + s->count = 2; + + return 0; +} + +static int btree_insert_raw(struct shadow_spine *s, dm_block_t root, + struct dm_btree_value_type *vt, + uint64_t key, unsigned *index) +{ + int r, i = *index, inc, top = 1; + struct node *node; + + for (;;) { + r = shadow_step(s, root, vt, &inc); + if (r < 0) + return r; + + node = dm_block_data(shadow_current(s)); + if (inc) + inc_children(s->info->tm, node, vt); + + /* + * We have to patch up the parent node, ugly, but I don't + * see a way to do this automatically as part of the spine + * op. + */ + if (shadow_has_parent(s) && i >= 0) { /* FIXME: second clause unness. */ + __le64 location = cpu_to_le64(dm_block_location(shadow_current(s))); + + __dm_bless_for_disk(&location); + memcpy_disk(value_ptr(dm_block_data(shadow_parent(s)), i, sizeof(uint64_t)), + &location, sizeof(__le64)); + } + + node = dm_block_data(shadow_current(s)); + + if (node->header.nr_entries == node->header.max_entries) { + if (top) + r = btree_split_beneath(s, key); + else + r = btree_split_sibling(s, root, i, key); + + if (r < 0) + return r; + } + + node = dm_block_data(shadow_current(s)); + + i = lower_bound(node, key); + + if (le32_to_cpu(node->header.flags) & LEAF_NODE) + break; + + if (i < 0) { + /* change the bounds on the lowest key */ + node->keys[0] = cpu_to_le64(key); + i = 0; + } + + root = value64(node, i); + top = 0; + } + + if (i < 0 || le64_to_cpu(node->keys[i]) != key) + i++; + + /* we're about to overwrite this value, so undo the increment for it */ + /* FIXME: shame that inc information is leaking outside the spine. 
+ * Plus inc is just plain wrong in the event of a split */ + if (le64_to_cpu(node->keys[i]) == key && inc) + if (vt->dec) + vt->dec(vt->context, value_ptr(node, i, vt->size)); + + *index = i; + return 0; +} + +static int insert(struct dm_btree_info *info, dm_block_t root, + uint64_t *keys, void *value, dm_block_t *new_root, + int *inserted) + __dm_written_to_disk(value) +{ + int r, need_insert; + unsigned level, index = -1, last_level = info->levels - 1; + dm_block_t block = root; + struct shadow_spine spine; + struct node *n; + struct dm_btree_value_type le64_type; + + le64_type.context = NULL; + le64_type.size = sizeof(__le64); + le64_type.inc = NULL; + le64_type.dec = NULL; + le64_type.equal = NULL; + + init_shadow_spine(&spine, info); + + for (level = 0; level < (info->levels - 1); level++) { + r = btree_insert_raw(&spine, block, &le64_type, keys[level], &index); + if (r < 0) + goto bad; + + n = dm_block_data(shadow_current(&spine)); + need_insert = ((index >= le32_to_cpu(n->header.nr_entries)) || + (le64_to_cpu(n->keys[index]) != keys[level])); + + if (need_insert) { + dm_block_t new_tree; + __le64 new_le; + + r = dm_btree_create(info, &new_tree); + if (r < 0) + goto bad; + + new_le = cpu_to_le64(new_tree); + __dm_bless_for_disk(&new_le); + + r = insert_at(sizeof(uint64_t), n, index, + keys[level], &new_le); + if (r) + goto bad; + } + + if (level < last_level) + block = value64(n, index); + } + + r = btree_insert_raw(&spine, block, &info->value_type, + keys[level], &index); + if (r < 0) + goto bad; + + n = dm_block_data(shadow_current(&spine)); + need_insert = ((index >= le32_to_cpu(n->header.nr_entries)) || + (le64_to_cpu(n->keys[index]) != keys[level])); + + if (need_insert) { + if (inserted) + *inserted = 1; + + r = insert_at(info->value_type.size, n, index, + keys[level], value); + if (r) + goto bad_unblessed; + } else { + if (inserted) + *inserted = 0; + + if (info->value_type.dec && + (!info->value_type.equal || + !info->value_type.equal( + info->value_type.context, + value_ptr(n, index, info->value_type.size), + value))) { + info->value_type.dec(info->value_type.context, + value_ptr(n, index, info->value_type.size)); + } + memcpy_disk(value_ptr(n, index, info->value_type.size), + value, info->value_type.size); + } + + *new_root = shadow_root(&spine); + exit_shadow_spine(&spine); + + return 0; + +bad: + __dm_unbless_for_disk(value); +bad_unblessed: + exit_shadow_spine(&spine); + return r; +} + +int dm_btree_insert(struct dm_btree_info *info, dm_block_t root, + uint64_t *keys, void *value, dm_block_t *new_root) + __dm_written_to_disk(value) +{ + return insert(info, root, keys, value, new_root, NULL); +} +EXPORT_SYMBOL_GPL(dm_btree_insert); + +int dm_btree_insert_notify(struct dm_btree_info *info, dm_block_t root, + uint64_t *keys, void *value, dm_block_t *new_root, + int *inserted) + __dm_written_to_disk(value) +{ + return insert(info, root, keys, value, new_root, inserted); +} +EXPORT_SYMBOL_GPL(dm_btree_insert_notify); + +/*----------------------------------------------------------------*/ + +int dm_btree_clone(struct dm_btree_info *info, dm_block_t root, + dm_block_t *clone) +{ + int r; + struct dm_block *b, *orig_b; + struct node *b_node, *orig_node; + + /* Copy the root node */ + r = new_block(info, &b); + if (r < 0) + return r; + + r = dm_tm_read_lock(info->tm, root, &btree_node_validator, &orig_b); + if (r < 0) { + dm_block_t location = dm_block_location(b); + + unlock_block(info, b); + dm_tm_dec(info->tm, location); + } + + *clone = dm_block_location(b); + b_node = 
dm_block_data(b); + orig_node = dm_block_data(orig_b); + + memcpy(b_node, orig_node, + dm_bm_block_size(dm_tm_get_bm(info->tm))); + dm_tm_unlock(info->tm, orig_b); + inc_children(info->tm, b_node, &info->value_type); + dm_tm_unlock(info->tm, b); + + return 0; +} +EXPORT_SYMBOL_GPL(dm_btree_clone); + +/*----------------------------------------------------------------*/ + +static int find_highest_key(struct ro_spine *s, dm_block_t block, + uint64_t *result_key, dm_block_t *next_block) +{ + int i, r; + uint32_t flags; + + do { + r = ro_step(s, block); + if (r < 0) + return r; + + flags = le32_to_cpu(ro_node(s)->header.flags); + i = le32_to_cpu(ro_node(s)->header.nr_entries); + if (!i) + return -ENODATA; + else + i--; + + *result_key = le64_to_cpu(ro_node(s)->keys[i]); + if (next_block || flags & INTERNAL_NODE) + block = value64(ro_node(s), i); + + } while (flags & INTERNAL_NODE); + + if (next_block) + *next_block = block; + return 0; +} + +int dm_btree_find_highest_key(struct dm_btree_info *info, dm_block_t root, + uint64_t *result_keys) +{ + int r = 0, count = 0, level; + struct ro_spine spine; + + init_ro_spine(&spine, info); + for (level = 0; level < info->levels; level++) { + r = find_highest_key(&spine, root, result_keys + level, + level == info->levels - 1 ? NULL : &root); + if (r == -ENODATA) { + r = 0; + break; + + } else if (r) + break; + + count++; + } + exit_ro_spine(&spine); + + return r ? r : count; +} +EXPORT_SYMBOL_GPL(dm_btree_find_highest_key); diff --cc drivers/md/persistent-data/dm-space-map-disk.c index 6229a4e68f88,000000000000..e6b9d67270ee mode 100644,000000..100644 --- a/drivers/md/persistent-data/dm-space-map-disk.c +++ b/drivers/md/persistent-data/dm-space-map-disk.c @@@ -1,663 -1,0 +1,663 @@@ +/* + * Copyright (C) 2011 Red Hat, Inc. All rights reserved. + * + * This file is released under the GPL. 
+ */ + +#include "dm-space-map-common.h" +#include "dm-space-map-disk.h" +#include "dm-space-map.h" +#include "dm-transaction-manager.h" + +#include +#include +#include - #include ++#include +#include + +#define DM_MSG_PREFIX "space map disk" + +/* + * Bitmap validator + */ +static void bitmap_prepare_for_write(struct dm_block_validator *v, + struct dm_block *b, + size_t block_size) +{ + struct disk_bitmap_header *disk_header = dm_block_data(b); + + disk_header->blocknr = cpu_to_le64(dm_block_location(b)); + disk_header->csum = cpu_to_le32(dm_block_csum_data(&disk_header->not_used, block_size - sizeof(__le32))); +} + +static int bitmap_check(struct dm_block_validator *v, + struct dm_block *b, + size_t block_size) +{ + struct disk_bitmap_header *disk_header = dm_block_data(b); + __le32 csum_disk; + + if (dm_block_location(b) != le64_to_cpu(disk_header->blocknr)) { + DMERR("bitmap check failed blocknr %llu wanted %llu", + le64_to_cpu(disk_header->blocknr), dm_block_location(b)); + return -ENOTBLK; + } + + csum_disk = cpu_to_le32(dm_block_csum_data(&disk_header->not_used, block_size - sizeof(__le32))); + if (csum_disk != disk_header->csum) { + DMERR("bitmap check failed csum %u wanted %u", + le32_to_cpu(csum_disk), le32_to_cpu(disk_header->csum)); + return -EILSEQ; + } + + return 0; +} + +struct dm_block_validator dm_sm_bitmap_validator = { + .name = "sm_bitmap", + .prepare_for_write = bitmap_prepare_for_write, + .check = bitmap_check +}; + +/*----------------------------------------------------------------*/ + +#define ENTRIES_PER_WORD 32 +#define ENTRIES_SHIFT 5 + +void *dm_bitmap_data(struct dm_block *b) +{ + return dm_block_data(b) + sizeof(struct disk_bitmap_header); +} + +#define WORD_MASK_LOW 0x5555555555555555ULL +#define WORD_MASK_HIGH 0xAAAAAAAAAAAAAAAAULL +#define WORD_MASK_ALL 0xFFFFFFFFFFFFFFFFULL + +static unsigned bitmap_word_used(void *addr, unsigned b) +{ + __le64 *words_le = addr; + __le64 *w_le = words_le + (b >> ENTRIES_SHIFT); + + uint64_t bits = le64_to_cpu(*w_le); + + return ((bits & WORD_MASK_LOW) == WORD_MASK_LOW || + (bits & WORD_MASK_HIGH) == WORD_MASK_HIGH || + (bits & WORD_MASK_ALL) == WORD_MASK_ALL); +} + +unsigned sm_lookup_bitmap(void *addr, unsigned b) +{ + __le64 *words_le = addr; + __le64 *w_le = words_le + (b >> ENTRIES_SHIFT); + + b = (b & (ENTRIES_PER_WORD - 1)) << 1; + + return (!!test_bit_le(b, (void *) w_le) << 1) | + (!!test_bit_le(b + 1, (void *) w_le)); +} + +void sm_set_bitmap(void *addr, unsigned b, unsigned val) +{ + __le64 *words_le = addr; + __le64 *w_le = words_le + (b >> ENTRIES_SHIFT); + + b = (b & (ENTRIES_PER_WORD - 1)) << 1; + + if (val & 2) + __set_bit_le(b, (void *) w_le); + else + __clear_bit_le(b, (void *) w_le); + + if (val & 1) + __set_bit_le(b + 1, (void *) w_le); + else + __clear_bit_le(b + 1, (void *) w_le); +} + +int sm_find_free(void *addr, unsigned begin, unsigned end, + unsigned *result) +{ + while (begin < end) { + if (!(begin & (ENTRIES_PER_WORD - 1)) && + bitmap_word_used(addr, begin)) { + begin += ENTRIES_PER_WORD; + continue; + } + + if (!sm_lookup_bitmap(addr, begin)) { + *result = begin; + return 0; + } + + begin++; + } + + return -ENOSPC; +} + +static int disk_ll_init(struct ll_disk *io, struct dm_transaction_manager *tm) +{ + io->tm = tm; + io->bitmap_info.tm = tm; + io->bitmap_info.levels = 1; + + /* + * Because the new bitmap blocks are created via a shadow + * operation, the old entry has already had its reference count + * decremented and we don't need the btree to do any bookkeeping. 
+ */ + io->bitmap_info.value_type.size = sizeof(struct disk_index_entry); + io->bitmap_info.value_type.inc = NULL; + io->bitmap_info.value_type.dec = NULL; + io->bitmap_info.value_type.equal = NULL; + + io->ref_count_info.tm = tm; + io->ref_count_info.levels = 1; + io->ref_count_info.value_type.size = sizeof(uint32_t); + io->ref_count_info.value_type.inc = NULL; + io->ref_count_info.value_type.dec = NULL; + io->ref_count_info.value_type.equal = NULL; + + io->block_size = dm_bm_block_size(dm_tm_get_bm(tm)); + + if (io->block_size > (1 << 30)) { + DMERR("block size too big to hold bitmaps"); + return -EINVAL; + } + + io->entries_per_block = (io->block_size - sizeof(struct disk_bitmap_header)) * + ENTRIES_PER_BYTE; + io->nr_blocks = 0; + io->bitmap_root = 0; + io->ref_count_root = 0; + + return 0; +} + +static int disk_ll_new(struct ll_disk *io, struct dm_transaction_manager *tm) +{ + int r; + + r = disk_ll_init(io, tm); + if (r < 0) + return r; + + io->nr_blocks = 0; + io->nr_allocated = 0; + r = dm_btree_create(&io->bitmap_info, &io->bitmap_root); + if (r < 0) + return r; + + r = dm_btree_create(&io->ref_count_info, &io->ref_count_root); + if (r < 0) { + dm_btree_destroy(&io->bitmap_info, io->bitmap_root); + return r; + } + + return 0; +} + +static int disk_ll_extend(struct ll_disk *io, dm_block_t extra_blocks) +{ + int r; + dm_block_t i, nr_blocks; + unsigned old_blocks, blocks; + + nr_blocks = io->nr_blocks + extra_blocks; + old_blocks = dm_sector_div_up(io->nr_blocks, io->entries_per_block); + blocks = dm_sector_div_up(nr_blocks, io->entries_per_block); + + for (i = old_blocks; i < blocks; i++) { + struct dm_block *b; + struct disk_index_entry idx; + + r = dm_tm_new_block(io->tm, &dm_sm_bitmap_validator, &b); + if (r < 0) + return r; + idx.blocknr = cpu_to_le64(dm_block_location(b)); + + r = dm_tm_unlock(io->tm, b); + if (r < 0) + return r; + + idx.nr_free = cpu_to_le32(io->entries_per_block); + idx.none_free_before = 0; + __dm_bless_for_disk(&idx); + + r = dm_btree_insert(&io->bitmap_info, io->bitmap_root, + &i, &idx, &io->bitmap_root); + if (r < 0) + return r; + } + + io->nr_blocks = nr_blocks; + return 0; +} + +static int disk_ll_open(struct ll_disk *ll, struct dm_transaction_manager *tm, + void *root_le, size_t len) +{ + int r; + struct disk_sm_root *smr = root_le; + + if (len < sizeof(struct disk_sm_root)) { + DMERR("sm_disk root too small"); + return -ENOMEM; + } + + r = disk_ll_init(ll, tm); + if (r < 0) + return r; + + ll->nr_blocks = le64_to_cpu(smr->nr_blocks); + ll->nr_allocated = le64_to_cpu(smr->nr_allocated); + ll->bitmap_root = le64_to_cpu(smr->bitmap_root); + ll->ref_count_root = le64_to_cpu(smr->ref_count_root); + + return 0; +} + +static int disk_ll_lookup_bitmap(struct ll_disk *io, dm_block_t b, uint32_t *result) +{ + int r; + dm_block_t index = b; + struct disk_index_entry ie_disk; + struct dm_block *blk; + + do_div(index, io->entries_per_block); + r = dm_btree_lookup(&io->bitmap_info, io->bitmap_root, &index, &ie_disk); + if (r < 0) + return r; + + r = dm_tm_read_lock(io->tm, le64_to_cpu(ie_disk.blocknr), &dm_sm_bitmap_validator, &blk); + if (r < 0) + return r; + + *result = sm_lookup_bitmap(dm_bitmap_data(blk), do_div(b, io->entries_per_block)); + + return dm_tm_unlock(io->tm, blk); +} + +static int disk_ll_lookup(struct ll_disk *io, dm_block_t b, uint32_t *result) +{ + __le32 rc_le; + int r = disk_ll_lookup_bitmap(io, b, result); + + if (r) + return r; + + if (*result != 3) + return r; + + r = dm_btree_lookup(&io->ref_count_info, io->ref_count_root, &b, &rc_le); + 
if (r < 0) + return r; + + *result = le32_to_cpu(rc_le); + + return r; +} + +static int disk_ll_find_free_block(struct ll_disk *io, dm_block_t begin, + dm_block_t end, dm_block_t *result) +{ + int r; + struct disk_index_entry ie_disk; + dm_block_t i, index_begin = begin; + dm_block_t index_end = dm_sector_div_up(end, io->entries_per_block); + + begin = do_div(index_begin, io->entries_per_block); + + for (i = index_begin; i < index_end; i++, begin = 0) { + struct dm_block *blk; + unsigned position; + uint32_t bit_end; + + r = dm_btree_lookup(&io->bitmap_info, io->bitmap_root, &i, &ie_disk); + if (r < 0) + return r; + + if (le32_to_cpu(ie_disk.nr_free) <= 0) + continue; + + r = dm_tm_read_lock(io->tm, le64_to_cpu(ie_disk.blocknr), + &dm_sm_bitmap_validator, &blk); + if (r < 0) + return r; + + bit_end = (i == index_end - 1) ? + do_div(end, io->entries_per_block) : io->entries_per_block; + + r = sm_find_free(dm_bitmap_data(blk), + max((unsigned)begin, (unsigned)le32_to_cpu(ie_disk.none_free_before)), + bit_end, &position); + if (r < 0) { + dm_tm_unlock(io->tm, blk); + continue; + } + + r = dm_tm_unlock(io->tm, blk); + if (r < 0) + return r; + + *result = i * io->entries_per_block + (dm_block_t) position; + + return 0; + } + + return -ENOSPC; +} + +static int disk_ll_insert(struct ll_disk *io, dm_block_t b, uint32_t ref_count) +{ + int r; + uint32_t bit, old; + struct dm_block *nb; + dm_block_t index = b; + struct disk_index_entry ie_disk; + void *bm_le; + int inc; + + do_div(index, io->entries_per_block); + r = dm_btree_lookup(&io->bitmap_info, io->bitmap_root, &index, &ie_disk); + if (r < 0) + return r; + + r = dm_tm_shadow_block(io->tm, le64_to_cpu(ie_disk.blocknr), + &dm_sm_bitmap_validator, &nb, &inc); + if (r < 0) { + DMERR("dm_tm_shadow_block() failed"); + return r; + } + ie_disk.blocknr = cpu_to_le64(dm_block_location(nb)); + + bm_le = dm_bitmap_data(nb); + bit = do_div(b, io->entries_per_block); + old = sm_lookup_bitmap(bm_le, bit); + + if (ref_count <= 2) { + sm_set_bitmap(bm_le, bit, ref_count); + + if (old > 2) { + r = dm_btree_remove(&io->ref_count_info, io->ref_count_root, + &b, &io->ref_count_root); + if (r) { + dm_tm_unlock(io->tm, nb); + return r; + } + } + } else { + __le32 rc_le = cpu_to_le32(ref_count); + + __dm_bless_for_disk(&rc_le); + + sm_set_bitmap(bm_le, bit, 3); + r = dm_btree_insert(&io->ref_count_info, io->ref_count_root, + &b, &rc_le, &io->ref_count_root); + if (r < 0) { + dm_tm_unlock(io->tm, nb); + DMERR("ref count insert failed"); + return r; + } + } + + r = dm_tm_unlock(io->tm, nb); + if (r < 0) + return r; + + if (ref_count && !old) { + io->nr_allocated++; + ie_disk.nr_free = cpu_to_le32(le32_to_cpu(ie_disk.nr_free) - 1); + if (le32_to_cpu(ie_disk.none_free_before) == b) + ie_disk.none_free_before = cpu_to_le32(b + 1); + + } else if (old && !ref_count) { + io->nr_allocated--; + ie_disk.nr_free = cpu_to_le32(le32_to_cpu(ie_disk.nr_free) + 1); + ie_disk.none_free_before = cpu_to_le32(min((dm_block_t) le32_to_cpu(ie_disk.none_free_before), b)); + } + + __dm_bless_for_disk(&ie_disk); + + r = dm_btree_insert(&io->bitmap_info, io->bitmap_root, &index, &ie_disk, &io->bitmap_root); + if (r < 0) + return r; + + return 0; +} + +static int disk_ll_inc(struct ll_disk *ll, dm_block_t b) +{ + int r; + uint32_t rc; + + r = disk_ll_lookup(ll, b, &rc); + if (r) + return r; + + return disk_ll_insert(ll, b, rc + 1); +} + +static int disk_ll_dec(struct ll_disk *ll, dm_block_t b) +{ + int r; + uint32_t rc; + + r = disk_ll_lookup(ll, b, &rc); + if (r) + return r; + + if (!rc) + 
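/* block is already free; decrementing again is a caller bug */ +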
return -EINVAL; + + return disk_ll_insert(ll, b, rc - 1); +} + +/*--------------------------------------------------------------*/ + +/* + * Space map interface. + */ +struct sm_disk { + struct dm_space_map sm; + + struct ll_disk ll; +}; + +static void sm_disk_destroy(struct dm_space_map *sm) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + kfree(smd); +} + +static int sm_disk_extend(struct dm_space_map *sm, dm_block_t extra_blocks) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + return disk_ll_extend(&smd->ll, extra_blocks); +} + +static int sm_disk_get_nr_blocks(struct dm_space_map *sm, dm_block_t *count) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + *count = smd->ll.nr_blocks; + + return 0; +} + +static int sm_disk_get_nr_free(struct dm_space_map *sm, dm_block_t *count) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + *count = smd->ll.nr_blocks - smd->ll.nr_allocated; + + return 0; +} + +static int sm_disk_get_count(struct dm_space_map *sm, dm_block_t b, + uint32_t *result) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + return disk_ll_lookup(&smd->ll, b, result); +} + +static int sm_disk_count_is_more_than_one(struct dm_space_map *sm, dm_block_t b, + int *result) +{ + int r; + uint32_t count; + + r = sm_disk_get_count(sm, b, &count); + if (r) + return r; + + return count > 1; +} + +static int sm_disk_set_count(struct dm_space_map *sm, dm_block_t b, + uint32_t count) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + return disk_ll_insert(&smd->ll, b, count); +} + +static int sm_disk_inc_block(struct dm_space_map *sm, dm_block_t b) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + return disk_ll_inc(&smd->ll, b); +} + +static int sm_disk_dec_block(struct dm_space_map *sm, dm_block_t b) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + return disk_ll_dec(&smd->ll, b); +} + +static int sm_disk_new_block(struct dm_space_map *sm, dm_block_t *b) +{ + int r; + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + + /* + * FIXME: We should start the search where we left off. 
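+ * As it stands, every allocation walks the index from block zero, skipping bitmaps whose nr_free has dropped to zero.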
+ */ + r = disk_ll_find_free_block(&smd->ll, 0, smd->ll.nr_blocks, b); + if (r) + return r; + + return disk_ll_inc(&smd->ll, *b); +} + +static int sm_disk_commit(struct dm_space_map *sm) +{ + return 0; +} + +static int sm_disk_root_size(struct dm_space_map *sm, size_t *result) +{ + *result = sizeof(struct disk_sm_root); + + return 0; +} + +static int sm_disk_copy_root(struct dm_space_map *sm, void *where_le, size_t max) +{ + struct sm_disk *smd = container_of(sm, struct sm_disk, sm); + struct disk_sm_root root_le; + + root_le.nr_blocks = cpu_to_le64(smd->ll.nr_blocks); + root_le.nr_allocated = cpu_to_le64(smd->ll.nr_allocated); + root_le.bitmap_root = cpu_to_le64(smd->ll.bitmap_root); + root_le.ref_count_root = cpu_to_le64(smd->ll.ref_count_root); + + if (max < sizeof(root_le)) + return -ENOSPC; + + memcpy(where_le, &root_le, sizeof(root_le)); + + return 0; +} + +/*----------------------------------------------------------------*/ + +static struct dm_space_map ops = { + .destroy = sm_disk_destroy, + .extend = sm_disk_extend, + .get_nr_blocks = sm_disk_get_nr_blocks, + .get_nr_free = sm_disk_get_nr_free, + .get_count = sm_disk_get_count, + .count_is_more_than_one = sm_disk_count_is_more_than_one, + .set_count = sm_disk_set_count, + .inc_block = sm_disk_inc_block, + .dec_block = sm_disk_dec_block, + .new_block = sm_disk_new_block, + .commit = sm_disk_commit, + .root_size = sm_disk_root_size, + .copy_root = sm_disk_copy_root +}; + +struct dm_space_map *dm_sm_disk_create(struct dm_transaction_manager *tm, + dm_block_t nr_blocks) +{ + int r; + struct sm_disk *smd; + + smd = kmalloc(sizeof(*smd), GFP_KERNEL); + if (!smd) + return ERR_PTR(-ENOMEM); + + memcpy(&smd->sm, &ops, sizeof(smd->sm)); + + r = disk_ll_new(&smd->ll, tm); + if (r) + goto bad; + + r = disk_ll_extend(&smd->ll, nr_blocks); + if (r) + goto bad; + + r = sm_disk_commit(&smd->sm); + if (r) + goto bad; + + return &smd->sm; + +bad: + kfree(smd); + return ERR_PTR(r); +} +EXPORT_SYMBOL_GPL(dm_sm_disk_create); + +struct dm_space_map *dm_sm_disk_open(struct dm_transaction_manager *tm, + void *root_le, size_t len) +{ + int r; + struct sm_disk *smd; + + smd = kmalloc(sizeof(*smd), GFP_KERNEL); + if (!smd) + return ERR_PTR(-ENOMEM); + + memcpy(&smd->sm, &ops, sizeof(smd->sm)); + + r = disk_ll_open(&smd->ll, tm, root_le, len); + if (r) + goto bad; + + r = sm_disk_commit(&smd->sm); + if (r) + goto bad; + + return &smd->sm; + +bad: + kfree(smd); + return ERR_PTR(r); +} +EXPORT_SYMBOL_GPL(dm_sm_disk_open); diff --cc drivers/md/persistent-data/dm-transaction-manager.c index be594dd0a12d,000000000000..e58e89ecfd67 mode 100644,000000..100644 --- a/drivers/md/persistent-data/dm-transaction-manager.c +++ b/drivers/md/persistent-data/dm-transaction-manager.c @@@ -1,414 -1,0 +1,414 @@@ +/* + * Copyright (C) 2011 Red Hat, Inc. All rights reserved. + * + * This file is released under the GPL. + */ +#include "dm-transaction-manager.h" +#include "dm-space-map.h" +#include "dm-space-map-disk.h" +#include "dm-space-map-metadata.h" +#include "dm-persistent-data-internal.h" + - #include ++#include +#include +#include + +#define DM_MSG_PREFIX "transaction manager" + +/*----------------------------------------------------------------*/ + +struct shadow_info { + struct hlist_node hlist; + dm_block_t where; +}; + +/* + * It would be nice if we scaled with the size of transaction. 
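+ * For now the shadow table is a fixed HASH_SIZE buckets, however many blocks a transaction touches.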
+ */ +#define HASH_SIZE 256 +#define HASH_MASK (HASH_SIZE - 1) + +struct dm_transaction_manager { + int is_clone; + struct dm_transaction_manager *real; + + struct dm_block_manager *bm; + struct dm_space_map *sm; + + spinlock_t lock; + struct hlist_head buckets[HASH_SIZE]; +}; + +/*----------------------------------------------------------------*/ + +static int is_shadow(struct dm_transaction_manager *tm, dm_block_t b) +{ + int r = 0; + unsigned bucket = dm_hash_block(b, HASH_MASK); + struct shadow_info *si; + struct hlist_node *n; + + spin_lock(&tm->lock); + + hlist_for_each_entry(si, n, tm->buckets + bucket, hlist) + if (si->where == b) { + r = 1; + break; + } + + spin_unlock(&tm->lock); + + return r; +} + +/* + * This can silently fail if there's no memory. We're ok with this since + * creating redundant shadows causes no harm. + */ +static void insert_shadow(struct dm_transaction_manager *tm, dm_block_t b) +{ + unsigned bucket; + struct shadow_info *si; + + si = kmalloc(sizeof(*si), GFP_NOIO); + if (si) { + si->where = b; + bucket = dm_hash_block(b, HASH_MASK); + + spin_lock(&tm->lock); + hlist_add_head(&si->hlist, tm->buckets + bucket); + spin_unlock(&tm->lock); + } +} + +static void wipe_shadow_table(struct dm_transaction_manager *tm) +{ + struct shadow_info *si; + struct hlist_node *n, *tmp; + struct hlist_head *bucket; + int i; + + spin_lock(&tm->lock); + for (i = 0; i < HASH_SIZE; i++) { + bucket = tm->buckets + i; + hlist_for_each_entry_safe(si, n, tmp, bucket, hlist) + kfree(si); + + INIT_HLIST_HEAD(bucket); + } + spin_unlock(&tm->lock); +} + +/*----------------------------------------------------------------*/ + +static struct dm_transaction_manager *dm_tm_create(struct dm_block_manager *bm, + struct dm_space_map *sm) +{ + int i; + struct dm_transaction_manager *tm; + + tm = kmalloc(sizeof(*tm), GFP_KERNEL); + if (!tm) + return ERR_PTR(-ENOMEM); + + tm->is_clone = 0; + tm->real = NULL; + tm->bm = bm; + tm->sm = sm; + + spin_lock_init(&tm->lock); + for (i = 0; i < HASH_SIZE; i++) + INIT_HLIST_HEAD(tm->buckets + i); + + return tm; +} + +struct dm_transaction_manager *dm_tm_create_non_blocking_clone(struct dm_transaction_manager *real) +{ + struct dm_transaction_manager *tm; + + tm = kmalloc(sizeof(*tm), GFP_KERNEL); + if (tm) { + tm->is_clone = 1; + tm->real = real; + } + + return tm; +} +EXPORT_SYMBOL_GPL(dm_tm_create_non_blocking_clone); + +void dm_tm_destroy(struct dm_transaction_manager *tm) +{ + kfree(tm); +} +EXPORT_SYMBOL_GPL(dm_tm_destroy); + +int dm_tm_pre_commit(struct dm_transaction_manager *tm) +{ + int r; + + if (tm->is_clone) + return -EWOULDBLOCK; + + r = dm_sm_commit(tm->sm); + if (r < 0) + return r; + + return 0; +} +EXPORT_SYMBOL_GPL(dm_tm_pre_commit); + +int dm_tm_commit(struct dm_transaction_manager *tm, struct dm_block *root) +{ + if (tm->is_clone) + return -EWOULDBLOCK; + + wipe_shadow_table(tm); + + return dm_bm_flush_and_unlock(tm->bm, root); +} +EXPORT_SYMBOL_GPL(dm_tm_commit); + +int dm_tm_new_block(struct dm_transaction_manager *tm, + struct dm_block_validator *v, + struct dm_block **result) +{ + int r; + dm_block_t new_block; + + if (tm->is_clone) + return -EWOULDBLOCK; + + r = dm_sm_new_block(tm->sm, &new_block); + if (r < 0) + return r; + + r = dm_bm_write_lock_zero(tm->bm, new_block, v, result); + if (r < 0) { + dm_sm_dec_block(tm->sm, new_block); + return r; + } + + /* + * New blocks count as shadows in that they don't need to be + * shadowed again. 
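+ * Nothing outside this transaction can reference a freshly allocated block, so there is no need to copy it on write.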
+ */ + insert_shadow(tm, new_block); + + return 0; +} + +static int __shadow_block(struct dm_transaction_manager *tm, dm_block_t orig, + struct dm_block_validator *v, + struct dm_block **result, int *inc_children) +{ + int r; + dm_block_t new; + uint32_t count; + struct dm_block *orig_block; + + r = dm_sm_new_block(tm->sm, &new); + if (r < 0) + return r; + + r = dm_bm_write_lock_zero(tm->bm, new, v, result); + if (r < 0) + goto bad_dec_block; + + r = dm_bm_read_lock(tm->bm, orig, v, &orig_block); + if (r < 0) + goto bad_dec_block; + + memcpy(dm_block_data(*result), dm_block_data(orig_block), + dm_bm_block_size(tm->bm)); + + r = dm_bm_unlock(orig_block); + if (r < 0) + goto bad_dec_block; + + r = dm_sm_get_count(tm->sm, orig, &count); + if (r < 0) + goto bad; + + r = dm_sm_dec_block(tm->sm, orig); + if (r < 0) + goto bad; + + *inc_children = count > 1; + + return 0; + +bad: + dm_bm_unlock(*result); +bad_dec_block: + dm_sm_dec_block(tm->sm, new); + + return r; +} + +int dm_tm_shadow_block(struct dm_transaction_manager *tm, dm_block_t orig, + struct dm_block_validator *v, struct dm_block **result, + int *inc_children) +{ + int r, more_than_one; + + if (tm->is_clone) + return -EWOULDBLOCK; + + if (is_shadow(tm, orig)) { + r = dm_sm_count_is_more_than_one(tm->sm, orig, &more_than_one); + if (r < 0) + return r; + + if (!more_than_one) { + *inc_children = 0; + return dm_bm_write_lock(tm->bm, orig, v, result); + } + /* fall through */ + } + + r = __shadow_block(tm, orig, v, result, inc_children); + if (r < 0) + return r; + + insert_shadow(tm, dm_block_location(*result)); + + return r; +} + +int dm_tm_read_lock(struct dm_transaction_manager *tm, dm_block_t b, + struct dm_block_validator *v, + struct dm_block **blk) +{ + if (tm->is_clone) + return dm_bm_read_try_lock(tm->real->bm, b, v, blk); + + return dm_bm_read_lock(tm->bm, b, v, blk); +} + +int dm_tm_unlock(struct dm_transaction_manager *tm, struct dm_block *b) +{ + return dm_bm_unlock(b); +} +EXPORT_SYMBOL_GPL(dm_tm_unlock); + +void dm_tm_inc(struct dm_transaction_manager *tm, dm_block_t b) +{ + /* + * The non-blocking clone doesn't support this. + */ + BUG_ON(tm->is_clone); + + dm_sm_inc_block(tm->sm, b); +} +EXPORT_SYMBOL_GPL(dm_tm_inc); + +void dm_tm_dec(struct dm_transaction_manager *tm, dm_block_t b) +{ + /* + * The non-blocking clone doesn't support this. 
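+ * Reference count changes go through the space map, which may need to perform blocking I/O.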
+ */ + BUG_ON(tm->is_clone); + + dm_sm_dec_block(tm->sm, b); +} + +int dm_tm_ref(struct dm_transaction_manager *tm, dm_block_t b, + uint32_t *result) +{ + if (tm->is_clone) + return -EWOULDBLOCK; + + return dm_sm_get_count(tm->sm, b, result); +} + +struct dm_block_manager *dm_tm_get_bm(struct dm_transaction_manager *tm) +{ + return tm->bm; +} + +/*----------------------------------------------------------------*/ + +static int dm_tm_create_internal(struct dm_block_manager *bm, + dm_block_t sb_location, + struct dm_block_validator *sb_validator, + size_t root_offset, size_t root_max_len, + struct dm_transaction_manager **tm, + struct dm_space_map **sm, + struct dm_block **sblock, + int create) +{ + int r; + + *sm = dm_sm_metadata_init(); + if (IS_ERR(*sm)) + return PTR_ERR(*sm); + + *tm = dm_tm_create(bm, *sm); + if (IS_ERR(*tm)) { + dm_sm_destroy(*sm); + return PTR_ERR(*tm); + } + + if (create) { + r = dm_bm_write_lock_zero(dm_tm_get_bm(*tm), sb_location, + sb_validator, sblock); + if (r < 0) { + DMERR("couldn't lock superblock"); + goto bad1; + } + + r = dm_sm_metadata_create(*sm, *tm, dm_bm_nr_blocks(bm), + sb_location); + if (r) { + DMERR("couldn't create metadata space map"); + goto bad2; + } + + } else { + r = dm_bm_write_lock(dm_tm_get_bm(*tm), sb_location, + sb_validator, sblock); + if (r < 0) { + DMERR("couldn't lock superblock"); + goto bad1; + } + + r = dm_sm_metadata_open(*sm, *tm, + dm_block_data(*sblock) + root_offset, + root_max_len); + if (IS_ERR(*sm)) { + DMERR("couldn't open metadata space map"); + goto bad2; + } + } + + return 0; + +bad2: + dm_tm_unlock(*tm, *sblock); +bad1: + dm_tm_destroy(*tm); + dm_sm_destroy(*sm); + return r; +} + +int dm_tm_create_with_sm(struct dm_block_manager *bm, dm_block_t sb_location, + struct dm_block_validator *sb_validator, + struct dm_transaction_manager **tm, + struct dm_space_map **sm, struct dm_block **sblock) +{ + return dm_tm_create_internal(bm, sb_location, sb_validator, + 0, 0, tm, sm, sblock, 1); +} +EXPORT_SYMBOL_GPL(dm_tm_create_with_sm); + +int dm_tm_open_with_sm(struct dm_block_manager *bm, dm_block_t sb_location, + struct dm_block_validator *sb_validator, + size_t root_offset, size_t root_max_len, + struct dm_transaction_manager **tm, + struct dm_space_map **sm, struct dm_block **sblock) +{ + return dm_tm_create_internal(bm, sb_location, sb_validator, root_offset, + root_max_len, tm, sm, sblock, 0); +} +EXPORT_SYMBOL_GPL(dm_tm_open_with_sm); diff --cc drivers/media/common/saa7146_core.c index f5d53a202344,31e53b6a881a..d6b1cf66042d --- a/drivers/media/common/saa7146_core.c +++ b/drivers/media/common/saa7146_core.c @@@ -18,9 -18,8 +18,10 @@@ Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. 
*/ +#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt + #include + #include LIST_HEAD(saa7146_devices); DEFINE_MUTEX(saa7146_devices_lock); diff --cc drivers/media/common/saa7146_fops.c index a92546144eaa,e4547afcfa88..71f8e018e564 --- a/drivers/media/common/saa7146_fops.c +++ b/drivers/media/common/saa7146_fops.c @@@ -1,6 -1,5 +1,7 @@@ +#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt + #include + #include /****************************************************************************/ /* resource management functions, shamelessly stolen from saa7134 driver */ diff --cc drivers/media/common/saa7146_hlp.c index 79ad73accb27,c9c6e9a6c31d..bc1f545c95cb --- a/drivers/media/common/saa7146_hlp.c +++ b/drivers/media/common/saa7146_hlp.c @@@ -1,6 -1,5 +1,7 @@@ +#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt + #include + #include #include static void calculate_output_format_register(struct saa7146_dev* saa, u32 palette, u32* clip_format) diff --cc drivers/media/common/saa7146_video.c index 384b358d3037,3a00253fe1ee..ce30533fd972 --- a/drivers/media/common/saa7146_video.c +++ b/drivers/media/common/saa7146_video.c @@@ -1,7 -1,6 +1,8 @@@ +#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt + #include #include + #include static int max_memory = 32; diff --cc drivers/media/dvb/frontends/dibx000_common.c index 774d507b66cc,977211fec137..43be7238311e --- a/drivers/media/dvb/frontends/dibx000_common.c +++ b/drivers/media/dvb/frontends/dibx000_common.c @@@ -1,5 -1,5 +1,6 @@@ #include +#include + #include #include "dibx000_common.h" diff --cc drivers/media/video/adp1653.c index 5914390211ff,c2594948ca3f..12eedf4d515a --- a/drivers/media/video/adp1653.c +++ b/drivers/media/video/adp1653.c @@@ -31,8 -31,8 +31,9 @@@ */ #include + #include #include +#include #include #include #include diff --cc drivers/mfd/max8997.c index dc58750bb71b,77032e43af4f..5be53ae9b61c --- a/drivers/mfd/max8997.c +++ b/drivers/mfd/max8997.c @@@ -23,8 -23,8 +23,9 @@@ #include #include +#include #include + #include #include #include #include diff --cc drivers/mfd/wm8400-core.c index e06ba9440cdb,b49b91eb44ec..36de271ba0e3 --- a/drivers/mfd/wm8400-core.c +++ b/drivers/mfd/wm8400-core.c @@@ -19,8 -18,8 +19,9 @@@ #include #include #include +#include #include + #include static struct { u16 readable; /* Mask of readable bits */ diff --cc drivers/mmc/host/sdhci-pci.c index f8a17f98f3a9,25513262b7d5..31ca4a85d220 --- a/drivers/mmc/host/sdhci-pci.c +++ b/drivers/mmc/host/sdhci-pci.c @@@ -21,8 -21,7 +21,9 @@@ #include #include #include +#include +#include + #include #include "sdhci.h" diff --cc drivers/mmc/host/sdhci-tegra.c index 47cee772f00a,93da9405b4a1..67176afcf2db --- a/drivers/mmc/host/sdhci-tegra.c +++ b/drivers/mmc/host/sdhci-tegra.c @@@ -22,8 -20,9 +22,9 @@@ #include #include #include + #include -#include +#include #include #include "sdhci-pltfm.h" diff --cc drivers/power/max8997_charger.c index e12b4a2a0be2,11ec2a3ec1e3..36fca3c6b368 --- a/drivers/power/max8997_charger.c +++ b/drivers/power/max8997_charger.c @@@ -19,8 -19,8 +19,9 @@@ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ + #include #include +#include #include #include #include diff --cc drivers/power/max8998_charger.c index 6f5ffc3e2f03,e08b8c6e8411..0737302af1d2 --- a/drivers/power/max8998_charger.c +++ b/drivers/power/max8998_charger.c @@@ -19,8 -19,8 +19,9 @@@ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ + #include #include +#include #include #include #include diff --cc drivers/s390/char/vmur.c index 
d291a54acfad,c9782ff042e1..6803b468d06d --- a/drivers/s390/char/vmur.c +++ b/drivers/s390/char/vmur.c @@@ -11,6 -11,8 +11,7 @@@ #define KMSG_COMPONENT "vmur" #define pr_fmt(fmt) KMSG_COMPONENT ": " fmt -#include + #include #include #include diff --cc drivers/scsi/libfc/fc_lport.c index 628f347404f9,f4e4885f71b7..31018a8465ab --- a/drivers/scsi/libfc/fc_lport.c +++ b/drivers/scsi/libfc/fc_lport.c @@@ -88,7 -88,7 +88,8 @@@ */ #include +#include + #include #include #include diff --cc drivers/staging/iio/industrialio-ring.c index dce50b1a4ee9,704da4a92653..859961608c99 --- a/drivers/staging/iio/industrialio-ring.c +++ b/drivers/staging/iio/industrialio-ring.c @@@ -19,9 -19,9 +19,10 @@@ #include #include #include + #include #include "iio.h" +#include "iio_core.h" #include "ring_generic.h" /** diff --cc drivers/video/backlight/ep93xx_bl.c index b0582917f0c8,00c142c41e84..c74a6f4baa12 --- a/drivers/video/backlight/ep93xx_bl.c +++ b/drivers/video/backlight/ep93xx_bl.c @@@ -11,8 -11,9 +11,9 @@@ * BRIGHT, on the Cirrus EP9307, EP9312, and EP9315 processors. */ - +#include #include + #include #include #include #include diff --cc drivers/video/sh_mobile_lcdcfb.c index 97ab8bac2494,499d54892017..4636f9dc30b0 --- a/drivers/video/sh_mobile_lcdcfb.c +++ b/drivers/video/sh_mobile_lcdcfb.c @@@ -23,8 -23,8 +23,9 @@@ #include #include #include + #include #include
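The pattern behind nearly every hunk in this merge: with module.h no longer pulled in implicitly by other headers, each file must include what it actually uses. The following is a minimal sketch of that rule, not a reconstruction of any hunk above; foo.c and its identifiers are hypothetical. A file that only exports symbols needs linux/export.h, while a file that registers itself as a module needs the full linux/module.h (which in turn includes export.h).

#include <linux/export.h>	/* EXPORT_SYMBOL_GPL() and friends */
#include <linux/module.h>	/* MODULE_LICENSE() and the rest of the module macros */
#include <linux/init.h>		/* __init, __exit */

/* a library-style helper: exporting it needs only export.h */
int foo_do_work(void)
{
	return 0;
}
EXPORT_SYMBOL_GPL(foo_do_work);

/* module entry points and metadata need module.h proper */
static int __init foo_init(void)
{
	return 0;
}
module_init(foo_init);

static void __exit foo_exit(void)
{
}
module_exit(foo_exit);

MODULE_LICENSE("GPL");

Built-in code that neither exports symbols nor defines a module needs neither header, which is why a few hunks above merely swap one include for another rather than adding one.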