diff options
author | Ulf Samuelsson <ulf.samuelsson@atmel.com> | 2007-08-16 06:26:25 +0000 |
---|---|---|
committer | Ulf Samuelsson <ulf.samuelsson@atmel.com> | 2007-08-16 06:26:25 +0000 |
commit | 18199aa7b69102c99c5b6c2382f039823c781e3b (patch) | |
tree | b33c03f416d0bb7448a1da5a27241ef088c19384 /toolchain/kernel-headers/lzma/linux-2.6.21.5-001-lzma-vmlinuz.00.patch | |
parent | c6771dfb847e53f8f5c184fad407cce599857ec9 (diff) | |
download | buildroot-novena-18199aa7b69102c99c5b6c2382f039823c781e3b.tar.gz buildroot-novena-18199aa7b69102c99c5b6c2382f039823c781e3b.zip |
Move lzma patches to toolchain/kernel-headers/lzma
They will be applied ONLY if BR2_KERNEL_HEADERS_LZMA is set.
BR2_KERNEL_HEADERS_LZMA defaults to NO, so the user
has to actively set this config flag if lzma is needed.
This means that the default behaviour of buildroot will work
for most users.
Comment from author:
[Brad House]
I find myself having to remove the lzma patches because my build system
doesn't natively have lzma. I tried to compensate for this by
installing the latest lzma from gentoo's package tree, and apparently,
it accepts different flags than the one these patches expect, so my
kernel build still fails. Finally, I used the lzma from this buildroot
and compiled it by hand, and it _mostly_ worked. Regardless, it seems
silly to make this a requirement. Personally, I gzip my initramfs,
and that's enough compression for me...
Diffstat (limited to 'toolchain/kernel-headers/lzma/linux-2.6.21.5-001-lzma-vmlinuz.00.patch')
-rw-r--r-- | toolchain/kernel-headers/lzma/linux-2.6.21.5-001-lzma-vmlinuz.00.patch | 27017 |
1 files changed, 27017 insertions, 0 deletions
diff --git a/toolchain/kernel-headers/lzma/linux-2.6.21.5-001-lzma-vmlinuz.00.patch b/toolchain/kernel-headers/lzma/linux-2.6.21.5-001-lzma-vmlinuz.00.patch new file mode 100644 index 000000000..87e50f8be --- /dev/null +++ b/toolchain/kernel-headers/lzma/linux-2.6.21.5-001-lzma-vmlinuz.00.patch @@ -0,0 +1,27017 @@ +diff --git a/.miniconfig b/.miniconfig +new file mode 100644 +index 0000000..5686e53 +--- /dev/null ++++ b/.miniconfig +@@ -0,0 +1,89 @@ ++#make allnoconfig KCONFIG_ALLCONFIG=miniconfig ++CONFIG_X86_32=y ++CONFIG_CLOCKSOURCE_WATCHDOG=y ++CONFIG_LOCKDEP_SUPPORT=y ++CONFIG_SEMAPHORE_SLEEPERS=y ++CONFIG_MMU=y ++CONFIG_GENERIC_ISA_DMA=y ++CONFIG_GENERIC_HWEIGHT=y ++CONFIG_DMI=y ++CONFIG_INIT_ENV_ARG_LIMIT=32 ++CONFIG_IKCONFIG=y ++CONFIG_IKCONFIG_PROC=y ++CONFIG_SYSFS_DEPRECATED=y ++CONFIG_BLK_DEV_INITRD=y ++CONFIG_SYSCTL=y ++CONFIG_EMBEDDED=y ++CONFIG_PRINTK=y ++CONFIG_BASE_SMALL=1 ++CONFIG_BLOCK=y ++CONFIG_IOSCHED_NOOP=y ++CONFIG_DEFAULT_IOSCHED="noop" ++CONFIG_X86_GENERIC=y ++CONFIG_X86_L1_CACHE_SHIFT=7 ++CONFIG_GENERIC_CALIBRATE_DELAY=y ++CONFIG_X86_WP_WORKS_OK=y ++CONFIG_X86_BSWAP=y ++CONFIG_X86_CMPXCHG64=y ++CONFIG_X86_INTEL_USERCOPY=y ++CONFIG_X86_TSC=y ++CONFIG_PREEMPT_NONE=y ++CONFIG_VM86=y ++CONFIG_HIGHMEM=y ++CONFIG_FLATMEM=y ++CONFIG_MTRR=y ++CONFIG_HZ_250=y ++CONFIG_PHYSICAL_ALIGN=0x100000 ++CONFIG_ARCH_ENABLE_MEMORY_HOTPLUG=y ++CONFIG_PM=y ++CONFIG_ACPI=y ++CONFIG_ACPI_SLEEP=y ++CONFIG_ACPI_BLACKLIST_YEAR=0 ++CONFIG_ACPI_EC=y ++CONFIG_ACPI_SYSTEM=y ++CONFIG_PCI=y ++CONFIG_PCI_GOANY=y ++CONFIG_PCI_DIRECT=y ++CONFIG_BINFMT_ELF=y ++CONFIG_STANDALONE=y ++CONFIG_BLK_DEV_LOOP=y ++CONFIG_IDE=y ++CONFIG_IDE_MAX_HWIFS=2 ++CONFIG_BLK_DEV_IDE=y ++CONFIG_BLK_DEV_IDEDISK=y ++CONFIG_IDEDISK_MULTI_MODE=y ++CONFIG_BLK_DEV_IDECD=y ++CONFIG_IDE_GENERIC=y ++CONFIG_INPUT_MOUSEDEV=y ++CONFIG_INPUT_MOUSEDEV_SCREEN_X=1024 ++CONFIG_INPUT_KEYBOARD=y ++CONFIG_KEYBOARD_ATKBD=y ++CONFIG_SERIO=y ++CONFIG_VT=y ++CONFIG_VT_CONSOLE=y ++CONFIG_UNIX98_PTYS=y ++CONFIG_VGA_CONSOLE=y ++CONFIG_USB_ARCH_HAS_HCD=y ++CONFIG_USB_ARCH_HAS_EHCI=y ++CONFIG_EXT2_FS=y ++CONFIG_DNOTIFY=y ++CONFIG_ISO9660_FS=y ++CONFIG_FAT_FS=y ++CONFIG_VFAT_FS=y ++CONFIG_FAT_DEFAULT_IOCHARSET="iso8859-1" ++CONFIG_PROC_FS=y ++CONFIG_PROC_SYSCTL=y ++CONFIG_SYSFS=y ++CONFIG_RAMFS=y ++CONFIG_SQUASHFS=y ++CONFIG_SQUASHFS_FRAGMENT_CACHE_SIZE=3 ++CONFIG_MSDOS_PARTITION=y ++CONFIG_NLS_DEFAULT="iso8859-1" ++CONFIG_AUFS=y ++CONFIG_AUFS_FAKE_DM=y ++CONFIG_EARLY_PRINTK=y ++CONFIG_DOUBLEFAULT=y ++CONFIG_ZLIB_INFLATE=y ++CONFIG_HAS_IOPORT=y ++CONFIG_GENERIC_IRQ_PROBE=y ++CONFIG_KTIME_SCALAR=y +diff --git a/Makefile b/Makefile +index d970cb1..a369204 100644 +--- a/Makefile ++++ b/Makefile +@@ -188,7 +188,7 @@ CROSS_COMPILE ?= + # Architecture as present in compile.h + UTS_MACHINE := $(ARCH) + +-KCONFIG_CONFIG ?= .config ++KCONFIG_CONFIG ?= .miniconfig + + # SHELL used by kbuild + CONFIG_SHELL := $(shell if [ -x "$$BASH" ]; then echo $$BASH; \ +diff --git a/arch/i386/boot/compressed/LzmaDecode.c b/arch/i386/boot/compressed/LzmaDecode.c +new file mode 100644 +index 0000000..21bf40b +--- /dev/null ++++ b/arch/i386/boot/compressed/LzmaDecode.c +@@ -0,0 +1,588 @@ ++/* ++ LzmaDecode.c ++ LZMA Decoder (optimized for Speed version) ++ ++ LZMA SDK 4.22 Copyright (c) 1999-2005 Igor Pavlov (2005-06-10) ++ http://www.7-zip.org/ ++ ++ LZMA SDK is licensed under two licenses: ++ 1) GNU Lesser General Public License (GNU LGPL) ++ 2) Common Public License (CPL) ++ It means that you can select one of these two licenses and ++ follow rules of that license. ++ ++ SPECIAL EXCEPTION: ++ Igor Pavlov, as the author of this Code, expressly permits you to ++ statically or dynamically link your Code (or bind by name) to the ++ interfaces of this file without subjecting your linked Code to the ++ terms of the CPL or GNU LGPL. Any modifications or additions ++ to this file, however, are subject to the LGPL or CPL terms. ++*/ ++ ++#include "LzmaDecode.h" ++ ++#ifndef Byte ++#define Byte unsigned char ++#endif ++ ++#define kNumTopBits 24 ++#define kTopValue ((UInt32)1 << kNumTopBits) ++ ++#define kNumBitModelTotalBits 11 ++#define kBitModelTotal (1 << kNumBitModelTotalBits) ++#define kNumMoveBits 5 ++ ++#define RC_READ_BYTE (*Buffer++) ++ ++#define RC_INIT2 Code = 0; Range = 0xFFFFFFFF; \ ++ { int i; for(i = 0; i < 5; i++) { RC_TEST; Code = (Code << 8) | RC_READ_BYTE; }} ++ ++#ifdef _LZMA_IN_CB ++ ++#define RC_TEST { if (Buffer == BufferLim) \ ++ { SizeT size; int result = InCallback->Read(InCallback, &Buffer, &size); if (result != LZMA_RESULT_OK) return result; \ ++ BufferLim = Buffer + size; if (size == 0) return LZMA_RESULT_DATA_ERROR; }} ++ ++#define RC_INIT Buffer = BufferLim = 0; RC_INIT2 ++ ++#else ++ ++#define RC_TEST { if (Buffer == BufferLim) return LZMA_RESULT_DATA_ERROR; } ++ ++#define RC_INIT(buffer, bufferSize) Buffer = buffer; BufferLim = buffer + bufferSize; RC_INIT2 ++ ++#endif ++ ++#define RC_NORMALIZE if (Range < kTopValue) { RC_TEST; Range <<= 8; Code = (Code << 8) | RC_READ_BYTE; } ++ ++#define IfBit0(p) RC_NORMALIZE; bound = (Range >> kNumBitModelTotalBits) * *(p); if (Code < bound) ++#define UpdateBit0(p) Range = bound; *(p) += (kBitModelTotal - *(p)) >> kNumMoveBits; ++#define UpdateBit1(p) Range -= bound; Code -= bound; *(p) -= (*(p)) >> kNumMoveBits; ++ ++#define RC_GET_BIT2(p, mi, A0, A1) IfBit0(p) \ ++ { UpdateBit0(p); mi <<= 1; A0; } else \ ++ { UpdateBit1(p); mi = (mi + mi) + 1; A1; } ++ ++#define RC_GET_BIT(p, mi) RC_GET_BIT2(p, mi, ; , ;) ++ ++#define RangeDecoderBitTreeDecode(probs, numLevels, res) \ ++ { int i = numLevels; res = 1; \ ++ do { CProb *p = probs + res; RC_GET_BIT(p, res) } while(--i != 0); \ ++ res -= (1 << numLevels); } ++ ++ ++#define kNumPosBitsMax 4 ++#define kNumPosStatesMax (1 << kNumPosBitsMax) ++ ++#define kLenNumLowBits 3 ++#define kLenNumLowSymbols (1 << kLenNumLowBits) ++#define kLenNumMidBits 3 ++#define kLenNumMidSymbols (1 << kLenNumMidBits) ++#define kLenNumHighBits 8 ++#define kLenNumHighSymbols (1 << kLenNumHighBits) ++ ++#define LenChoice 0 ++#define LenChoice2 (LenChoice + 1) ++#define LenLow (LenChoice2 + 1) ++#define LenMid (LenLow + (kNumPosStatesMax << kLenNumLowBits)) ++#define LenHigh (LenMid + (kNumPosStatesMax << kLenNumMidBits)) ++#define kNumLenProbs (LenHigh + kLenNumHighSymbols) ++ ++ ++#define kNumStates 12 ++#define kNumLitStates 7 ++ ++#define kStartPosModelIndex 4 ++#define kEndPosModelIndex 14 ++#define kNumFullDistances (1 << (kEndPosModelIndex >> 1)) ++ ++#define kNumPosSlotBits 6 ++#define kNumLenToPosStates 4 ++ ++#define kNumAlignBits 4 ++#define kAlignTableSize (1 << kNumAlignBits) ++ ++#define kMatchMinLen 2 ++ ++#define IsMatch 0 ++#define IsRep (IsMatch + (kNumStates << kNumPosBitsMax)) ++#define IsRepG0 (IsRep + kNumStates) ++#define IsRepG1 (IsRepG0 + kNumStates) ++#define IsRepG2 (IsRepG1 + kNumStates) ++#define IsRep0Long (IsRepG2 + kNumStates) ++#define PosSlot (IsRep0Long + (kNumStates << kNumPosBitsMax)) ++#define SpecPos (PosSlot + (kNumLenToPosStates << kNumPosSlotBits)) ++#define Align (SpecPos + kNumFullDistances - kEndPosModelIndex) ++#define LenCoder (Align + kAlignTableSize) ++#define RepLenCoder (LenCoder + kNumLenProbs) ++#define Literal (RepLenCoder + kNumLenProbs) ++ ++#if Literal != LZMA_BASE_SIZE ++StopCompilingDueBUG ++#endif ++ ++int LzmaDecodeProperties(CLzmaProperties *propsRes, const unsigned char *propsData, int size) ++{ ++ unsigned char prop0; ++ if (size < LZMA_PROPERTIES_SIZE) ++ return LZMA_RESULT_DATA_ERROR; ++ prop0 = propsData[0]; ++ if (prop0 >= (9 * 5 * 5)) ++ return LZMA_RESULT_DATA_ERROR; ++ { ++ for (propsRes->pb = 0; prop0 >= (9 * 5); propsRes->pb++, prop0 -= (9 * 5)); ++ for (propsRes->lp = 0; prop0 >= 9; propsRes->lp++, prop0 -= 9); ++ propsRes->lc = prop0; ++ /* ++ unsigned char remainder = (unsigned char)(prop0 / 9); ++ propsRes->lc = prop0 % 9; ++ propsRes->pb = remainder / 5; ++ propsRes->lp = remainder % 5; ++ */ ++ } ++ ++ #ifdef _LZMA_OUT_READ ++ { ++ int i; ++ propsRes->DictionarySize = 0; ++ for (i = 0; i < 4; i++) ++ propsRes->DictionarySize += (UInt32)(propsData[1 + i]) << (i * 8); ++ if (propsRes->DictionarySize == 0) ++ propsRes->DictionarySize = 1; ++ } ++ #endif ++ return LZMA_RESULT_OK; ++} ++ ++#define kLzmaStreamWasFinishedId (-1) ++ ++int LzmaDecode(CLzmaDecoderState *vs, ++ #ifdef _LZMA_IN_CB ++ ILzmaInCallback *InCallback, ++ #else ++ const unsigned char *inStream, SizeT inSize, SizeT *inSizeProcessed, ++ #endif ++ unsigned char *outStream, SizeT outSize, SizeT *outSizeProcessed) ++{ ++ CProb *p = vs->Probs; ++ SizeT nowPos = 0; ++ Byte previousByte = 0; ++ UInt32 posStateMask = (1 << (vs->Properties.pb)) - 1; ++ UInt32 literalPosMask = (1 << (vs->Properties.lp)) - 1; ++ int lc = vs->Properties.lc; ++ ++ #ifdef _LZMA_OUT_READ ++ ++ UInt32 Range = vs->Range; ++ UInt32 Code = vs->Code; ++ #ifdef _LZMA_IN_CB ++ const Byte *Buffer = vs->Buffer; ++ const Byte *BufferLim = vs->BufferLim; ++ #else ++ const Byte *Buffer = inStream; ++ const Byte *BufferLim = inStream + inSize; ++ #endif ++ int state = vs->State; ++ UInt32 rep0 = vs->Reps[0], rep1 = vs->Reps[1], rep2 = vs->Reps[2], rep3 = vs->Reps[3]; ++ int len = vs->RemainLen; ++ UInt32 globalPos = vs->GlobalPos; ++ UInt32 distanceLimit = vs->DistanceLimit; ++ ++ Byte *dictionary = vs->Dictionary; ++ UInt32 dictionarySize = vs->Properties.DictionarySize; ++ UInt32 dictionaryPos = vs->DictionaryPos; ++ ++ Byte tempDictionary[4]; ++ ++ #ifndef _LZMA_IN_CB ++ *inSizeProcessed = 0; ++ #endif ++ *outSizeProcessed = 0; ++ if (len == kLzmaStreamWasFinishedId) ++ return LZMA_RESULT_OK; ++ ++ if (dictionarySize == 0) ++ { ++ dictionary = tempDictionary; ++ dictionarySize = 1; ++ tempDictionary[0] = vs->TempDictionary[0]; ++ } ++ ++ if (len == kLzmaNeedInitId) ++ { ++ { ++ UInt32 numProbs = Literal + ((UInt32)LZMA_LIT_SIZE << (lc + vs->Properties.lp)); ++ UInt32 i; ++ for (i = 0; i < numProbs; i++) ++ p[i] = kBitModelTotal >> 1; ++ rep0 = rep1 = rep2 = rep3 = 1; ++ state = 0; ++ globalPos = 0; ++ distanceLimit = 0; ++ dictionaryPos = 0; ++ dictionary[dictionarySize - 1] = 0; ++ #ifdef _LZMA_IN_CB ++ RC_INIT; ++ #else ++ RC_INIT(inStream, inSize); ++ #endif ++ } ++ len = 0; ++ } ++ while(len != 0 && nowPos < outSize) ++ { ++ UInt32 pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ outStream[nowPos++] = dictionary[dictionaryPos] = dictionary[pos]; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ len--; ++ } ++ if (dictionaryPos == 0) ++ previousByte = dictionary[dictionarySize - 1]; ++ else ++ previousByte = dictionary[dictionaryPos - 1]; ++ ++ #else /* if !_LZMA_OUT_READ */ ++ ++ int state = 0; ++ UInt32 rep0 = 1, rep1 = 1, rep2 = 1, rep3 = 1; ++ int len = 0; ++ const Byte *Buffer; ++ const Byte *BufferLim; ++ UInt32 Range; ++ UInt32 Code; ++ ++ #ifndef _LZMA_IN_CB ++ *inSizeProcessed = 0; ++ #endif ++ *outSizeProcessed = 0; ++ ++ { ++ UInt32 i; ++ UInt32 numProbs = Literal + ((UInt32)LZMA_LIT_SIZE << (lc + vs->Properties.lp)); ++ for (i = 0; i < numProbs; i++) ++ p[i] = kBitModelTotal >> 1; ++ } ++ ++ #ifdef _LZMA_IN_CB ++ RC_INIT; ++ #else ++ RC_INIT(inStream, inSize); ++ #endif ++ ++ #endif /* _LZMA_OUT_READ */ ++ ++ while(nowPos < outSize) ++ { ++ CProb *prob; ++ UInt32 bound; ++ int posState = (int)( ++ (nowPos ++ #ifdef _LZMA_OUT_READ ++ + globalPos ++ #endif ++ ) ++ & posStateMask); ++ ++ prob = p + IsMatch + (state << kNumPosBitsMax) + posState; ++ IfBit0(prob) ++ { ++ int symbol = 1; ++ UpdateBit0(prob) ++ prob = p + Literal + (LZMA_LIT_SIZE * ++ ((( ++ (nowPos ++ #ifdef _LZMA_OUT_READ ++ + globalPos ++ #endif ++ ) ++ & literalPosMask) << lc) + (previousByte >> (8 - lc)))); ++ ++ if (state >= kNumLitStates) ++ { ++ int matchByte; ++ #ifdef _LZMA_OUT_READ ++ UInt32 pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ matchByte = dictionary[pos]; ++ #else ++ matchByte = outStream[nowPos - rep0]; ++ #endif ++ do ++ { ++ int bit; ++ CProb *probLit; ++ matchByte <<= 1; ++ bit = (matchByte & 0x100); ++ probLit = prob + 0x100 + bit + symbol; ++ RC_GET_BIT2(probLit, symbol, if (bit != 0) break, if (bit == 0) break) ++ } ++ while (symbol < 0x100); ++ } ++ while (symbol < 0x100) ++ { ++ CProb *probLit = prob + symbol; ++ RC_GET_BIT(probLit, symbol) ++ } ++ previousByte = (Byte)symbol; ++ ++ outStream[nowPos++] = previousByte; ++ #ifdef _LZMA_OUT_READ ++ if (distanceLimit < dictionarySize) ++ distanceLimit++; ++ ++ dictionary[dictionaryPos] = previousByte; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ #endif ++ if (state < 4) state = 0; ++ else if (state < 10) state -= 3; ++ else state -= 6; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ prob = p + IsRep + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ rep3 = rep2; ++ rep2 = rep1; ++ rep1 = rep0; ++ state = state < kNumLitStates ? 0 : 3; ++ prob = p + LenCoder; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ prob = p + IsRepG0 + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ prob = p + IsRep0Long + (state << kNumPosBitsMax) + posState; ++ IfBit0(prob) ++ { ++ #ifdef _LZMA_OUT_READ ++ UInt32 pos; ++ #endif ++ UpdateBit0(prob); ++ ++ #ifdef _LZMA_OUT_READ ++ if (distanceLimit == 0) ++ #else ++ if (nowPos == 0) ++ #endif ++ return LZMA_RESULT_DATA_ERROR; ++ ++ state = state < kNumLitStates ? 9 : 11; ++ #ifdef _LZMA_OUT_READ ++ pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ previousByte = dictionary[pos]; ++ dictionary[dictionaryPos] = previousByte; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ #else ++ previousByte = outStream[nowPos - rep0]; ++ #endif ++ outStream[nowPos++] = previousByte; ++ #ifdef _LZMA_OUT_READ ++ if (distanceLimit < dictionarySize) ++ distanceLimit++; ++ #endif ++ ++ continue; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ } ++ } ++ else ++ { ++ UInt32 distance; ++ UpdateBit1(prob); ++ prob = p + IsRepG1 + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ distance = rep1; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ prob = p + IsRepG2 + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ distance = rep2; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ distance = rep3; ++ rep3 = rep2; ++ } ++ rep2 = rep1; ++ } ++ rep1 = rep0; ++ rep0 = distance; ++ } ++ state = state < kNumLitStates ? 8 : 11; ++ prob = p + RepLenCoder; ++ } ++ { ++ int numBits, offset; ++ CProb *probLen = prob + LenChoice; ++ IfBit0(probLen) ++ { ++ UpdateBit0(probLen); ++ probLen = prob + LenLow + (posState << kLenNumLowBits); ++ offset = 0; ++ numBits = kLenNumLowBits; ++ } ++ else ++ { ++ UpdateBit1(probLen); ++ probLen = prob + LenChoice2; ++ IfBit0(probLen) ++ { ++ UpdateBit0(probLen); ++ probLen = prob + LenMid + (posState << kLenNumMidBits); ++ offset = kLenNumLowSymbols; ++ numBits = kLenNumMidBits; ++ } ++ else ++ { ++ UpdateBit1(probLen); ++ probLen = prob + LenHigh; ++ offset = kLenNumLowSymbols + kLenNumMidSymbols; ++ numBits = kLenNumHighBits; ++ } ++ } ++ RangeDecoderBitTreeDecode(probLen, numBits, len); ++ len += offset; ++ } ++ ++ if (state < 4) ++ { ++ int posSlot; ++ state += kNumLitStates; ++ prob = p + PosSlot + ++ ((len < kNumLenToPosStates ? len : kNumLenToPosStates - 1) << ++ kNumPosSlotBits); ++ RangeDecoderBitTreeDecode(prob, kNumPosSlotBits, posSlot); ++ if (posSlot >= kStartPosModelIndex) ++ { ++ int numDirectBits = ((posSlot >> 1) - 1); ++ rep0 = (2 | ((UInt32)posSlot & 1)); ++ if (posSlot < kEndPosModelIndex) ++ { ++ rep0 <<= numDirectBits; ++ prob = p + SpecPos + rep0 - posSlot - 1; ++ } ++ else ++ { ++ numDirectBits -= kNumAlignBits; ++ do ++ { ++ RC_NORMALIZE ++ Range >>= 1; ++ rep0 <<= 1; ++ if (Code >= Range) ++ { ++ Code -= Range; ++ rep0 |= 1; ++ } ++ } ++ while (--numDirectBits != 0); ++ prob = p + Align; ++ rep0 <<= kNumAlignBits; ++ numDirectBits = kNumAlignBits; ++ } ++ { ++ int i = 1; ++ int mi = 1; ++ do ++ { ++ CProb *prob3 = prob + mi; ++ RC_GET_BIT2(prob3, mi, ; , rep0 |= i); ++ i <<= 1; ++ } ++ while(--numDirectBits != 0); ++ } ++ } ++ else ++ rep0 = posSlot; ++ if (++rep0 == (UInt32)(0)) ++ { ++ /* it's for stream version */ ++ len = kLzmaStreamWasFinishedId; ++ break; ++ } ++ } ++ ++ len += kMatchMinLen; ++ #ifdef _LZMA_OUT_READ ++ if (rep0 > distanceLimit) ++ #else ++ if (rep0 > nowPos) ++ #endif ++ return LZMA_RESULT_DATA_ERROR; ++ ++ #ifdef _LZMA_OUT_READ ++ if (dictionarySize - distanceLimit > (UInt32)len) ++ distanceLimit += len; ++ else ++ distanceLimit = dictionarySize; ++ #endif ++ ++ do ++ { ++ #ifdef _LZMA_OUT_READ ++ UInt32 pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ previousByte = dictionary[pos]; ++ dictionary[dictionaryPos] = previousByte; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ #else ++ previousByte = outStream[nowPos - rep0]; ++ #endif ++ len--; ++ outStream[nowPos++] = previousByte; ++ } ++ while(len != 0 && nowPos < outSize); ++ } ++ } ++ RC_NORMALIZE; ++ ++ #ifdef _LZMA_OUT_READ ++ vs->Range = Range; ++ vs->Code = Code; ++ vs->DictionaryPos = dictionaryPos; ++ vs->GlobalPos = globalPos + (UInt32)nowPos; ++ vs->DistanceLimit = distanceLimit; ++ vs->Reps[0] = rep0; ++ vs->Reps[1] = rep1; ++ vs->Reps[2] = rep2; ++ vs->Reps[3] = rep3; ++ vs->State = state; ++ vs->RemainLen = len; ++ vs->TempDictionary[0] = tempDictionary[0]; ++ #endif ++ ++ #ifdef _LZMA_IN_CB ++ vs->Buffer = Buffer; ++ vs->BufferLim = BufferLim; ++ #else ++ *inSizeProcessed = (SizeT)(Buffer - inStream); ++ #endif ++ *outSizeProcessed = nowPos; ++ return LZMA_RESULT_OK; ++} +diff --git a/arch/i386/boot/compressed/LzmaDecode.h b/arch/i386/boot/compressed/LzmaDecode.h +new file mode 100644 +index 0000000..213062a +--- /dev/null ++++ b/arch/i386/boot/compressed/LzmaDecode.h +@@ -0,0 +1,131 @@ ++/* ++ LzmaDecode.h ++ LZMA Decoder interface ++ ++ LZMA SDK 4.21 Copyright (c) 1999-2005 Igor Pavlov (2005-06-08) ++ http://www.7-zip.org/ ++ ++ LZMA SDK is licensed under two licenses: ++ 1) GNU Lesser General Public License (GNU LGPL) ++ 2) Common Public License (CPL) ++ It means that you can select one of these two licenses and ++ follow rules of that license. ++ ++ SPECIAL EXCEPTION: ++ Igor Pavlov, as the author of this code, expressly permits you to ++ statically or dynamically link your code (or bind by name) to the ++ interfaces of this file without subjecting your linked code to the ++ terms of the CPL or GNU LGPL. Any modifications or additions ++ to this file, however, are subject to the LGPL or CPL terms. ++*/ ++ ++#ifndef __LZMADECODE_H ++#define __LZMADECODE_H ++ ++/* #define _LZMA_IN_CB */ ++/* Use callback for input data */ ++ ++/* #define _LZMA_OUT_READ */ ++/* Use read function for output data */ ++ ++/* #define _LZMA_PROB32 */ ++/* It can increase speed on some 32-bit CPUs, ++ but memory usage will be doubled in that case */ ++ ++/* #define _LZMA_LOC_OPT */ ++/* Enable local speed optimizations inside code */ ++ ++/* #define _LZMA_SYSTEM_SIZE_T */ ++/* Use system's size_t. You can use it to enable 64-bit sizes supporting*/ ++ ++#ifndef UInt32 ++#ifdef _LZMA_UINT32_IS_ULONG ++#define UInt32 unsigned long ++#else ++#define UInt32 unsigned int ++#endif ++#endif ++ ++#ifndef SizeT ++#ifdef _LZMA_SYSTEM_SIZE_T ++#include <stddef.h> ++#define SizeT size_t ++#else ++#define SizeT UInt32 ++#endif ++#endif ++ ++#ifdef _LZMA_PROB32 ++#define CProb UInt32 ++#else ++#define CProb unsigned short ++#endif ++ ++#define LZMA_RESULT_OK 0 ++#define LZMA_RESULT_DATA_ERROR 1 ++ ++#ifdef _LZMA_IN_CB ++typedef struct _ILzmaInCallback ++{ ++ int (*Read)(void *object, const unsigned char **buffer, SizeT *bufferSize); ++} ILzmaInCallback; ++#endif ++ ++#define LZMA_BASE_SIZE 1846 ++#define LZMA_LIT_SIZE 768 ++ ++#define LZMA_PROPERTIES_SIZE 5 ++ ++typedef struct _CLzmaProperties ++{ ++ int lc; ++ int lp; ++ int pb; ++ #ifdef _LZMA_OUT_READ ++ UInt32 DictionarySize; ++ #endif ++}CLzmaProperties; ++ ++int LzmaDecodeProperties(CLzmaProperties *propsRes, const unsigned char *propsData, int size); ++ ++#define LzmaGetNumProbs(Properties) (LZMA_BASE_SIZE + (LZMA_LIT_SIZE << ((Properties)->lc + (Properties)->lp))) ++ ++#define kLzmaNeedInitId (-2) ++ ++typedef struct _CLzmaDecoderState ++{ ++ CLzmaProperties Properties; ++ CProb *Probs; ++ ++ #ifdef _LZMA_IN_CB ++ const unsigned char *Buffer; ++ const unsigned char *BufferLim; ++ #endif ++ ++ #ifdef _LZMA_OUT_READ ++ unsigned char *Dictionary; ++ UInt32 Range; ++ UInt32 Code; ++ UInt32 DictionaryPos; ++ UInt32 GlobalPos; ++ UInt32 DistanceLimit; ++ UInt32 Reps[4]; ++ int State; ++ int RemainLen; ++ unsigned char TempDictionary[4]; ++ #endif ++} CLzmaDecoderState; ++ ++#ifdef _LZMA_OUT_READ ++#define LzmaDecoderInit(vs) { (vs)->RemainLen = kLzmaNeedInitId; } ++#endif ++ ++int LzmaDecode(CLzmaDecoderState *vs, ++ #ifdef _LZMA_IN_CB ++ ILzmaInCallback *inCallback, ++ #else ++ const unsigned char *inStream, SizeT inSize, SizeT *inSizeProcessed, ++ #endif ++ unsigned char *outStream, SizeT outSize, SizeT *outSizeProcessed); ++ ++#endif +diff --git a/arch/i386/boot/compressed/Makefile b/arch/i386/boot/compressed/Makefile +index a661217..fb40869 100644 +--- a/arch/i386/boot/compressed/Makefile ++++ b/arch/i386/boot/compressed/Makefile +@@ -4,15 +4,16 @@ + # create a compressed vmlinux image from the original vmlinux + # + +-targets := vmlinux vmlinux.bin vmlinux.bin.gz head.o misc.o piggy.o \ +- vmlinux.bin.all vmlinux.relocs ++tragets := head.o lzma_misc.o piggy.o \ ++ vmlinux.bin.all vmlinux.relocs \ ++ vmlinux vmlinux.bin vmlinux.bin.gz + EXTRA_AFLAGS := -traditional + + LDFLAGS_vmlinux := -T +-CFLAGS_misc.o += -fPIC ++CFLAGS_lzma_misc.o += -fPIC + hostprogs-y := relocs + +-$(obj)/vmlinux: $(src)/vmlinux.lds $(obj)/head.o $(obj)/misc.o $(obj)/piggy.o FORCE ++$(obj)/vmlinux: $(src)/vmlinux.lds $(obj)/head.o $(obj)/lzma_misc.o $(obj)/piggy.o FORCE + $(call if_changed,ld) + @: + +@@ -33,10 +34,10 @@ $(obj)/vmlinux.bin.all: $(vmlinux.bin.all-y) FORCE + + ifdef CONFIG_RELOCATABLE + $(obj)/vmlinux.bin.gz: $(obj)/vmlinux.bin.all FORCE +- $(call if_changed,gzip) ++ $(call if_changed,lzma) + else + $(obj)/vmlinux.bin.gz: $(obj)/vmlinux.bin FORCE +- $(call if_changed,gzip) ++ $(call if_changed,lzma) + endif + + LDFLAGS_piggy.o := -r --format binary --oformat elf32-i386 -T +diff --git a/arch/i386/boot/compressed/lzma_misc.c b/arch/i386/boot/compressed/lzma_misc.c +new file mode 100644 +index 0000000..4f5f7f9 +--- /dev/null ++++ b/arch/i386/boot/compressed/lzma_misc.c +@@ -0,0 +1,290 @@ ++/* ++ * lzma_misc.c ++ * ++ * Decompress LZMA compressed vmlinuz ++ * Version 0.9 Copyright (c) Ming-Ching Tiew mctiew@yahoo.com ++ * Program adapted from misc.c for 2.6.20.1 kernel ++ * Please refer to misc.c for authorship and copyright. ++ * Date: 25 March 2007 ++ * Source released under GPL ++ */ ++ ++#undef CONFIG_PARAVIRT ++#include <linux/linkage.h> ++#include <linux/vmalloc.h> ++#include <linux/screen_info.h> ++#include <asm/io.h> ++#include <asm/page.h> ++#include <asm/boot.h> ++ ++/* WARNING!! ++ * This code is compiled with -fPIC and it is relocated dynamically ++ * at run time, but no relocation processing is performed. ++ * This means that it is not safe to place pointers in static structures. ++ */ ++ ++#define OF(args) args ++#define STATIC static ++ ++#undef memset ++#undef memcpy ++ ++typedef unsigned char uch; ++typedef unsigned short ush; ++typedef unsigned long ulg; ++ ++#define WSIZE 0x80000000 /* Window size must be at least 32k, ++ * and a power of two ++ * We don't actually have a window just ++ * a huge output buffer so I report ++ * a 2G windows size, as that should ++ * always be larger than our output buffer. ++ */ ++ ++static uch *inbuf; /* input buffer */ ++static uch *window; /* Sliding window buffer, (and final output buffer) */ ++ ++static unsigned insize; /* valid bytes in inbuf */ ++static unsigned inptr; /* index of next byte to be processed in inbuf */ ++ ++/* gzip flag byte */ ++#define ASCII_FLAG 0x01 /* bit 0 set: file probably ASCII text */ ++#define CONTINUATION 0x02 /* bit 1 set: continuation of multi-part gzip file */ ++#define EXTRA_FIELD 0x04 /* bit 2 set: extra field present */ ++#define ORIG_NAME 0x08 /* bit 3 set: original file name present */ ++#define COMMENT 0x10 /* bit 4 set: file comment present */ ++#define ENCRYPTED 0x20 /* bit 5 set: file is encrypted */ ++#define RESERVED 0xC0 /* bit 6,7: reserved */ ++ ++#define get_byte() (inptr < insize ? inbuf[inptr++] : fill_inbuf()) ++ ++/* Diagnostic functions */ ++#ifdef DEBUG ++# define Assert(cond,msg) {if(!(cond)) error(msg);} ++# define Trace(x) fprintf x ++# define Tracev(x) {if (verbose) fprintf x ;} ++# define Tracevv(x) {if (verbose>1) fprintf x ;} ++# define Tracec(c,x) {if (verbose && (c)) fprintf x ;} ++# define Tracecv(c,x) {if (verbose>1 && (c)) fprintf x ;} ++#else ++# define Assert(cond,msg) ++# define Trace(x) ++# define Tracev(x) ++# define Tracevv(x) ++# define Tracec(c,x) ++# define Tracecv(c,x) ++#endif ++ ++static int fill_inbuf(void); ++static void error(char *m); ++ ++/* ++ * This is set up by the setup-routine at boot-time ++ */ ++static unsigned char *real_mode; /* Pointer to real-mode data */ ++ ++#define RM_EXT_MEM_K (*(unsigned short *)(real_mode + 0x2)) ++#ifndef STANDARD_MEMORY_BIOS_CALL ++#define RM_ALT_MEM_K (*(unsigned long *)(real_mode + 0x1e0)) ++#endif ++#define RM_SCREEN_INFO (*(struct screen_info *)(real_mode+0)) ++ ++extern unsigned char input_data[]; ++extern int input_len; ++ ++static long bytes_out = 0; ++ ++static void *memcpy(void *dest, const void *src, unsigned n); ++ ++static void putstr(const char *); ++ ++static unsigned long free_mem_ptr; ++static unsigned long free_mem_end_ptr; ++ ++#define HEAP_SIZE 0x3000 ++ ++static char *vidmem = (char *)0xb8000; ++static int vidport; ++static int lines, cols; ++ ++#ifdef CONFIG_X86_NUMAQ ++void *xquad_portio; ++#endif ++ ++static void scroll(void) ++{ ++ int i; ++ ++ memcpy ( vidmem, vidmem + cols * 2, ( lines - 1 ) * cols * 2 ); ++ for ( i = ( lines - 1 ) * cols * 2; i < lines * cols * 2; i += 2 ) ++ vidmem[i] = ' '; ++} ++ ++static void putstr(const char *s) ++{ ++ int x,y,pos; ++ char c; ++ ++ x = RM_SCREEN_INFO.orig_x; ++ y = RM_SCREEN_INFO.orig_y; ++ ++ while ( ( c = *s++ ) != '\0' ) { ++ if ( c == '\n' ) { ++ x = 0; ++ if ( ++y >= lines ) { ++ scroll(); ++ y--; ++ } ++ } else { ++ vidmem [ ( x + cols * y ) * 2 ] = c; ++ if ( ++x >= cols ) { ++ x = 0; ++ if ( ++y >= lines ) { ++ scroll(); ++ y--; ++ } ++ } ++ } ++ } ++ ++ RM_SCREEN_INFO.orig_x = x; ++ RM_SCREEN_INFO.orig_y = y; ++ ++ pos = (x + cols * y) * 2; /* Update cursor position */ ++ outb_p(14, vidport); ++ outb_p(0xff & (pos >> 9), vidport+1); ++ outb_p(15, vidport); ++ outb_p(0xff & (pos >> 1), vidport+1); ++} ++ ++static void* memcpy(void* dest, const void* src, unsigned n) ++{ ++ int i; ++ char *d = (char *)dest, *s = (char *)src; ++ ++ for (i=0;i<n;i++) d[i] = s[i]; ++ return dest; ++} ++ ++/* =========================================================================== ++ * Fill the input buffer. This is called only when the buffer is empty ++ * and at least one byte is really needed. ++ */ ++static int fill_inbuf(void) ++{ ++ error("ran out of input data"); ++ return 0; ++} ++ ++/* =========================================================================== ++ */ ++static void error(char *x) ++{ ++ putstr("\n\n"); ++ putstr(x); ++ putstr("\n\n -- System halted"); ++ ++ while(1); /* Halt */ ++} ++ ++#define _LZMA_IN_CB ++#include "LzmaDecode.h" ++#include "LzmaDecode.c" ++ ++static int read_byte(void *object, const unsigned char **buffer, SizeT *bufferSize); ++ ++/* ++ * Do the lzma decompression ++ */ ++static int lzma_unzip(uch* output) ++{ ++ ++ unsigned int i; ++ CLzmaDecoderState state; ++ unsigned int uncompressedSize = 0; ++ unsigned char* p; ++ ++ ILzmaInCallback callback; ++ callback.Read = read_byte; ++ ++ // lzma args ++ i = get_byte(); ++ state.Properties.lc = i % 9, i = i / 9; ++ state.Properties.lp = i % 5, state.Properties.pb = i / 5; ++ ++ // skip dictionary size ++ for (i = 0; i < 4; i++) ++ get_byte(); ++ // get uncompressed size ++ p= (char*)&uncompressedSize; ++ for (i = 0; i < 4; i++) ++ *p++ = get_byte(); ++ ++ // skip high order bytes ++ for (i = 0; i < 4; i++) ++ get_byte(); ++ ++ // Just point it beyond ++ state.Probs = (CProb*) ( free_mem_ptr ); ++ // decompress kernel ++ if (LzmaDecode( &state, &callback, ++ (unsigned char*)output, uncompressedSize, &i) == LZMA_RESULT_OK) ++ { ++ if ( i != uncompressedSize ) ++ error( "kernel corrupted!\n"); ++ bytes_out = i; ++ return 0; ++ } ++ return 1; ++} ++ ++ ++static int read_byte(void *object, const unsigned char **buffer, SizeT *bufferSize) ++{ ++ static unsigned int i = 0; ++ static unsigned char val; ++ *bufferSize = 1; ++ val = get_byte(); ++ *buffer = &val; ++ return LZMA_RESULT_OK; ++} ++ ++asmlinkage void decompress_kernel(void *rmode, unsigned long end, ++ uch *input_data, unsigned long input_len, uch *output) ++{ ++ real_mode = rmode; ++ ++ if (RM_SCREEN_INFO.orig_video_mode == 7) { ++ vidmem = (char *) 0xb0000; ++ vidport = 0x3b4; ++ } else { ++ vidmem = (char *) 0xb8000; ++ vidport = 0x3d4; ++ } ++ ++ lines = RM_SCREEN_INFO.orig_video_lines; ++ cols = RM_SCREEN_INFO.orig_video_cols; ++ ++ window = output; /* Output buffer (Normally at 1M) */ ++ free_mem_ptr = end; /* Heap */ ++ free_mem_end_ptr = end + HEAP_SIZE; ++ inbuf = input_data; /* Input buffer */ ++ insize = input_len; ++ inptr = 0; ++ ++ if ((u32)output & (CONFIG_PHYSICAL_ALIGN -1)) ++ error("Destination address not CONFIG_PHYSICAL_ALIGN aligned"); ++ if (end > ((-__PAGE_OFFSET-(512 <<20)-1) & 0x7fffffff)) ++ error("Destination address too large"); ++#ifndef CONFIG_RELOCATABLE ++ if ((u32)output != LOAD_PHYSICAL_ADDR) ++ error("Wrong destination address"); ++#endif ++ if( lzma_unzip(output) != 0 ) ++ { ++ error("inflate error\n"); ++ } ++ putstr("Ok, booting the kernel.\n"); ++ ++ return; ++} +diff --git a/arch/i386/boot/compressed/vmlinux.scr b/arch/i386/boot/compressed/vmlinux.scr +index 707a88f..9d67263 100644 +--- a/arch/i386/boot/compressed/vmlinux.scr ++++ b/arch/i386/boot/compressed/vmlinux.scr +@@ -3,8 +3,8 @@ SECTIONS + .data.compressed : { + input_len = .; + LONG(input_data_end - input_data) input_data = .; ++ output_len = . + 5; + *(.data) +- output_len = . - 4; + input_data_end = .; + } + } +diff --git a/drivers/block/Kconfig b/drivers/block/Kconfig +index 17ee97f..64b7bda 100644 +--- a/drivers/block/Kconfig ++++ b/drivers/block/Kconfig +@@ -406,6 +406,47 @@ config BLK_DEV_RAM_BLOCKSIZE + setups function - apparently needed by the rd_load_image routine + that supposes the filesystem in the image uses a 1024 blocksize. + ++config LZMA_INITRD ++ boolean "Allow LZMA compression on initrd" ++ depends on BLK_DEV_INITRD=y ++ default "y" ++ help ++ Use lzma compression on initrd, example 'lzma e initrd initrd.7z -d16'. ++ If you have sufficient memory, you could compress using bigger dictionary size, ++ 'lzma e initrd initrd.7z'. ++ ++config LZMA_INITRD_KMALLOC_ONLY ++ boolean "Use only kmalloc, do not use vmalloc on lzma initrd" ++ depends on LZMA_INITRD=y ++ default "n" ++ help ++ Set to y if you do not want to use vmalloc, ie use only kmalloc. ++ ++config LZMA_INITRAM_FS ++ boolean "Allow LZMA compression on initramfs" ++ depends on BLK_DEV_RAM=y ++ default "y" ++ help ++ Use lzma compression on initramfs, example 'lzma e initramfs.cpio initramfs.cpio.lzma'. ++ ++config LZMA_INITRAM_FS_SMALLMEM ++ boolean "Use lzma compression with small dictonary size." ++ depends on LZMA_INITRAM_FS=y ++ default "y" ++ help ++ Use lzma compression on initramfs with small dictionary size, example ++ 'lzma e initramfs.cpio initramfs.cpio.lzma -d16'. ++ Affects only the initramfs.cpio in the ~usr directory, which is compiled into ++ the kernel. If you prepared initramfs.cpio for use with bootloader, you would ++ need to specify the commandline options (-d16) yourself. ++ ++config LZMA_INITRAM_FS_KMALLOC_ONLY ++ boolean "Use only kmalloc, do not use vmalloc on lzma initramfs" ++ depends on LZMA_INITRAM_FS=y ++ default "n" ++ help ++ Set to y if you do not want to use vmalloc, ie use only kmalloc. ++ + config CDROM_PKTCDVD + tristate "Packet writing on CD/DVD media" + depends on !UML +diff --git a/fs/Kconfig b/fs/Kconfig +index 3c4886b..bdcc6fb 100644 +--- a/fs/Kconfig ++++ b/fs/Kconfig +@@ -1371,6 +1371,71 @@ config CRAMFS + + If unsure, say N. + ++config SQUASHFS ++ tristate "SquashFS 3.2 - Squashed file system support" ++ select ZLIB_INFLATE ++ help ++ Saying Y here includes support for SquashFS 3.2 (a Compressed Read-Only File ++ System). Squashfs is a highly compressed read-only filesystem for Linux. ++ It uses zlib compression to compress both files, inodes and directories. ++ Inodes in the system are very small and all blocks are packed to minimise ++ data overhead. Block sizes greater than 4K are supported up to a maximum of 64K. ++ SquashFS 3.1 supports 64 bit filesystems and files (larger than 4GB), full ++ uid/gid information, hard links and timestamps. ++ ++ Squashfs is intended for general read-only filesystem use, for archival ++ use (i.e. in cases where a .tar.gz file may be used), and in embedded ++ systems where low overhead is needed. Further information and filesystem tools ++ are available from http://squashfs.sourceforge.net. ++ ++ If you want to compile this as a module ( = code which can be ++ inserted in and removed from the running kernel whenever you want), ++ say M here and read <file:Documentation/modules.txt>. The module ++ will be called squashfs. Note that the root file system (the one ++ containing the directory /) cannot be compiled as a module. ++ ++ If unsure, say N. ++ ++config SQUASHFS_EMBEDDED ++ ++ bool "Additional options for memory-constrained systems" ++ depends on SQUASHFS ++ default n ++ help ++ Saying Y here allows you to specify cache sizes and how Squashfs ++ allocates memory. This is only intended for memory constrained ++ systems. ++ ++ If unsure, say N. ++ ++config SQUASHFS_FRAGMENT_CACHE_SIZE ++ int "Number of fragments cached" if SQUASHFS_EMBEDDED ++ depends on SQUASHFS ++ default "3" ++ help ++ By default SquashFS caches the last 3 fragments read from ++ the filesystem. Increasing this amount may mean SquashFS ++ has to re-read fragments less often from disk, at the expense ++ of extra system memory. Decreasing this amount will mean ++ SquashFS uses less memory at the expense of extra reads from disk. ++ ++ Note there must be at least one cached fragment. Anything ++ much more than three will probably not make much difference. ++ ++config SQUASHFS_VMALLOC ++ bool "Use Vmalloc rather than Kmalloc" if SQUASHFS_EMBEDDED ++ depends on SQUASHFS ++ default n ++ help ++ By default SquashFS uses kmalloc to obtain fragment cache memory. ++ Kmalloc memory is the standard kernel allocator, but it can fail ++ on memory constrained systems. Because of the way Vmalloc works, ++ Vmalloc can succeed when kmalloc fails. Specifying this option ++ will make SquashFS always use Vmalloc to allocate the ++ fragment cache memory. ++ ++ If unsure, say N. ++ + config VXFS_FS + tristate "FreeVxFS file system support (VERITAS VxFS(TM) compatible)" + depends on BLOCK +@@ -2057,3 +2122,4 @@ source "fs/dlm/Kconfig" + + endmenu + ++source "fs/aufs/Kconfig" +diff --git a/fs/Makefile b/fs/Makefile +index 9edf411..557766f 100644 +--- a/fs/Makefile ++++ b/fs/Makefile +@@ -68,6 +68,7 @@ obj-$(CONFIG_JBD) += jbd/ + obj-$(CONFIG_JBD2) += jbd2/ + obj-$(CONFIG_EXT2_FS) += ext2/ + obj-$(CONFIG_CRAMFS) += cramfs/ ++obj-$(CONFIG_SQUASHFS) += squashfs/ + obj-$(CONFIG_RAMFS) += ramfs/ + obj-$(CONFIG_HUGETLBFS) += hugetlbfs/ + obj-$(CONFIG_CODA_FS) += coda/ +@@ -114,3 +115,4 @@ obj-$(CONFIG_HPPFS) += hppfs/ + obj-$(CONFIG_DEBUG_FS) += debugfs/ + obj-$(CONFIG_OCFS2_FS) += ocfs2/ + obj-$(CONFIG_GFS2_FS) += gfs2/ ++obj-$(CONFIG_AUFS) += aufs/ +diff --git a/fs/aufs/Kconfig b/fs/aufs/Kconfig +new file mode 100644 +index 0000000..3a2121c +--- /dev/null ++++ b/fs/aufs/Kconfig +@@ -0,0 +1,73 @@ ++config AUFS ++ tristate "Another unionfs" ++ help ++ Aufs is a stackable unification filesystem such as Unionfs, ++ which unifies several directories and provides a merged single ++ directory. ++ In the early days, aufs was entirely re-designed and ++ re-implemented Unionfs Version 1.x series. After many original ++ ideas, approaches and improvements, it becomes totally ++ different from Unionfs while keeping the basic features. ++ See Unionfs for the basic features. ++ ++if AUFS ++comment "These options are generated automatically for "#UTS_RELEASE ++ ++config AUFS_FAKE_DM ++ bool "Use simplified (fake) nameidata" ++ depends on AUFS ++ default y ++ help ++ Faking nameidata (VFS internal data), you can get better performance ++ in some cases. ++ ++choice ++ prompt "Maximum number of branches" ++ depends on AUFS ++ default AUFS_BRANCH_MAX_127 ++ help ++ Specifies the maximum number of branches (or member directories) in a single aufs. The larger value consumes more system resources and has an impact to performance. ++config AUFS_BRANCH_MAX_127 ++ bool "127" ++ help ++ Specifies the maximum number of branches (or member directories) in a single aufs. The larger value consumes more system resources and has an impact to performance. ++config AUFS_BRANCH_MAX_511 ++ bool "511" ++ help ++ Specifies the maximum number of branches (or member directories) in a single aufs. The larger value consumes more system resources and has an impact to performance. ++config AUFS_BRANCH_MAX_1023 ++ bool "1023" ++ help ++ Specifies the maximum number of branches (or member directories) in a single aufs. The larger value consumes more system resources and has an impact to performance. ++ ++config AUFS_BRANCH_MAX_32767 ++ bool "32767" ++ help ++ Specifies the maximum number of branches (or member directories) in a single aufs. The larger value consumes more system resources and has an impact to performance. ++endchoice ++config AUFS_DEBUG ++ bool "Debug aufs" ++ depends on AUFS ++ default y ++ help ++ Enable this to compile aufs internal debug code. ++ The performance will be damaged. ++ ++config AUFS_COMPAT ++ bool "Compatibility with Unionfs (obsolete)" ++ depends on AUFS ++ default n ++ help ++ This makes aufs compatible with unionfs-style mount options and some ++ behaviours. ++ The dirs= mount option and =nfsro branch permission flag are always ++ interpreted as br: mount option and =ro flag respectively. The ++ 'debug', 'delete' and 'imap' mount options are ignored. ++ If you disable this option, you will get, ++ - aufs issues a warning about the ignored mount options ++ - the default branch permission flag is set. RW for the first branch, ++ and RO for the rests. ++ - the name of a internal file which represents the directory is ++ 'opaque', becomes '.wh..wh..opq' ++ - the 'diropq=w' mount option is set by default ++endif +diff --git a/fs/aufs/Makefile b/fs/aufs/Makefile +new file mode 100755 +index 0000000..0ee3cd0 +--- /dev/null ++++ b/fs/aufs/Makefile +@@ -0,0 +1,18 @@ ++# AUFS Makefile for the Linux 2.6.16 and later ++# $Id: Makefile,v 1.29 2007/04/23 00:59:50 sfjro Exp $ ++ ++obj-$(CONFIG_AUFS) += aufs.o ++aufs-y := module.o super.o sbinfo.o xino.o \ ++ branch.o cpup.o whout.o plink.o wkq.o dcsub.o vfsub.o \ ++ opts.o \ ++ dentry.o dinfo.o \ ++ file.o f_op.o finfo.o \ ++ dir.o vdir.o \ ++ inode.o i_op.o i_op_add.o i_op_del.o i_op_ren.o iinfo.o \ ++ misc.o ++#xattr.o ++aufs-$(CONFIG_AUFS_SYSAUFS) += sysaufs.o ++aufs-$(CONFIG_AUFS_HINOTIFY) += hinotify.o ++aufs-$(CONFIG_AUFS_EXPORT) += export.o ++#aufs-$(CONFIG_DEBUGFS) += dbgfs.o ++aufs-$(CONFIG_AUFS_DEBUG) += debug.o +diff --git a/fs/aufs/aufs.h b/fs/aufs/aufs.h +new file mode 100755 +index 0000000..79b3b87 +--- /dev/null ++++ b/fs/aufs/aufs.h +@@ -0,0 +1,64 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: aufs.h,v 1.24 2007/05/14 03:41:51 sfjro Exp $ */ ++ ++#ifndef __AUFS_H__ ++#define __AUFS_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/version.h> ++ ++/* limited support before 2.6.16, curretly 2.6.15 only. */ ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,16) ++#define atomic_long_t atomic_t ++#define atomic_long_set atomic_set ++#define timespec_to_ns(ts) ({(long long)(ts)->tv_sec;}) ++#define D_CHILD d_child ++#else ++#define D_CHILD d_u.d_child ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++#include "debug.h" ++ ++#include "branch.h" ++#include "cpup.h" ++#include "dcsub.h" ++#include "dentry.h" ++#include "dir.h" ++#include "file.h" ++#include "inode.h" ++#include "misc.h" ++#include "module.h" ++#include "opts.h" ++#include "super.h" ++#include "sysaufs.h" ++#include "vfsub.h" ++#include "whout.h" ++#include "wkq.h" ++//#include "xattr.h" ++ ++#if defined(CONFIG_AUFS_MODULE) && !defined(CONFIG_AUFS_KSIZE_PATCH) ++#define ksize(p) (-1U) ++#endif ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_H__ */ +diff --git a/fs/aufs/branch.c b/fs/aufs/branch.c +new file mode 100755 +index 0000000..f1ce008 +--- /dev/null ++++ b/fs/aufs/branch.c +@@ -0,0 +1,818 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: branch.c,v 1.49 2007/05/14 03:38:23 sfjro Exp $ */ ++ ++//#include <linux/fs.h> ++//#include <linux/namei.h> ++#include "aufs.h" ++ ++static void free_branch(struct aufs_branch *br) ++{ ++ TraceEnter(); ++ ++ if (br->br_xino) ++ fput(br->br_xino); ++ dput(br->br_wh); ++ dput(br->br_plink); ++ mntput(br->br_mnt); ++ DEBUG_ON(br_count(br) || atomic_read(&br->br_wh_running)); ++ kfree(br); ++} ++ ++/* ++ * frees all branches ++ */ ++void free_branches(struct aufs_sbinfo *sbinfo) ++{ ++ aufs_bindex_t bmax; ++ struct aufs_branch **br; ++ ++ TraceEnter(); ++ bmax = sbinfo->si_bend + 1; ++ br = sbinfo->si_branch; ++ while (bmax--) ++ free_branch(*br++); ++} ++ ++/* ++ * find the index of a branch which is specified by @br_id. ++ */ ++int find_brindex(struct super_block *sb, aufs_bindex_t br_id) ++{ ++ aufs_bindex_t bindex, bend; ++ ++ TraceEnter(); ++ ++ bend = sbend(sb); ++ for (bindex = 0; bindex <= bend; bindex++) ++ if (sbr_id(sb, bindex) == br_id) ++ return bindex; ++ return -1; ++} ++ ++/* ++ * test if the @br is readonly or not. ++ */ ++int br_rdonly(struct aufs_branch *br) ++{ ++ return ((br->br_mnt->mnt_sb->s_flags & MS_RDONLY) ++ || !br_writable(br->br_perm)) ++ ? -EROFS : 0; ++} ++ ++/* ++ * returns writable branch index, otherwise an error. ++ * todo: customizable writable-branch-policy ++ */ ++static int find_rw_parent(struct dentry *dentry, aufs_bindex_t bend) ++{ ++ int err; ++ aufs_bindex_t bindex, candidate; ++ struct super_block *sb; ++ struct dentry *parent, *hidden_parent; ++ ++ err = bend; ++ sb = dentry->d_sb; ++ parent = dget_parent(dentry); ++#if 1 // branch policy ++ hidden_parent = au_h_dptr_i(parent, bend); ++ if (hidden_parent && !br_rdonly(stobr(sb, bend))) ++ goto out; /* success */ ++#endif ++ ++ candidate = -1; ++ for (bindex = dbstart(parent); bindex <= bend; bindex++) { ++ hidden_parent = au_h_dptr_i(parent, bindex); ++ if (hidden_parent && !br_rdonly(stobr(sb, bindex))) { ++#if 0 // branch policy ++ if (candidate == -1) ++ candidate = bindex; ++ if (!au_test_perm(hidden_parent->d_inode, MAY_WRITE)) ++ return bindex; ++#endif ++ err = bindex; ++ goto out; /* success */ ++ } ++ } ++#if 0 // branch policy ++ err = candidate; ++ if (candidate != -1) ++ goto out; /* success */ ++#endif ++ err = -EROFS; ++ ++ out: ++ dput(parent); ++ return err; ++} ++ ++int find_rw_br(struct super_block *sb, aufs_bindex_t bend) ++{ ++ aufs_bindex_t bindex; ++ ++ for (bindex = bend; bindex >= 0; bindex--) ++ if (!br_rdonly(stobr(sb, bindex))) ++ return bindex; ++ return -EROFS; ++} ++ ++int find_rw_parent_br(struct dentry *dentry, aufs_bindex_t bend) ++{ ++ int err; ++ ++ err = find_rw_parent(dentry, bend); ++ if (err >= 0) ++ return err; ++ return find_rw_br(dentry->d_sb, bend); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * test if two hidden_dentries have overlapping branches. ++ */ ++//todo: try is_subdir() ++static int do_is_overlap(struct super_block *sb, struct dentry *hidden_d1, ++ struct dentry *hidden_d2) ++{ ++ struct dentry *d; ++ ++ d = hidden_d1; ++ do { ++ if (unlikely(d == hidden_d2)) ++ return 1; ++ d = d->d_parent; // dget_parent() ++ } while (!IS_ROOT(d)); ++ ++ return (d == hidden_d2); ++} ++ ++#if defined(CONFIG_BLK_DEV_LOOP) || defined(CONFIG_BLK_DEV_LOOP_MODULE) ++#include <linux/loop.h> ++static int is_overlap_loopback(struct super_block *sb, struct dentry *hidden_d1, ++ struct dentry *hidden_d2) ++{ ++ struct inode *hidden_inode; ++ struct loop_device *l; ++ ++ hidden_inode = hidden_d1->d_inode; ++ if (MAJOR(hidden_inode->i_sb->s_dev) != LOOP_MAJOR) ++ return 0; ++ ++ l = hidden_inode->i_sb->s_bdev->bd_disk->private_data; ++ hidden_d1 = l->lo_backing_file->f_dentry; ++ if (unlikely(hidden_d1->d_sb == sb)) ++ return 1; ++ return do_is_overlap(sb, hidden_d1, hidden_d2); ++} ++#else ++#define is_overlap_loopback(sb, hidden_d1, hidden_d2) 0 ++#endif ++ ++static int is_overlap(struct super_block *sb, struct dentry *hidden_d1, ++ struct dentry *hidden_d2) ++{ ++ LKTRTrace("d1 %.*s, d2 %.*s\n", DLNPair(hidden_d1), DLNPair(hidden_d2)); ++ if (unlikely(hidden_d1 == hidden_d2)) ++ return 1; ++ return do_is_overlap(sb, hidden_d1, hidden_d2) ++ || do_is_overlap(sb, hidden_d2, hidden_d1) ++ || is_overlap_loopback(sb, hidden_d1, hidden_d2) ++ || is_overlap_loopback(sb, hidden_d2, hidden_d1); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int init_br_wh(struct super_block *sb, aufs_bindex_t bindex, ++ struct aufs_branch *br, int new_perm, ++ struct dentry *h_root, struct vfsmount *h_mnt) ++{ ++ int err, old_perm; ++ struct inode *dir = sb->s_root->d_inode, ++ *h_dir = h_root->d_inode; ++ const int new = (bindex < 0); ++ ++ LKTRTrace("b%d, new_perm %d\n", bindex, new_perm); ++ ++ if (new) ++ hi_lock_parent(h_dir); ++ else ++ hdir_lock(h_dir, dir, bindex); ++ ++ br_wh_write_lock(br); ++ old_perm = br->br_perm; ++ br->br_perm = new_perm; ++ err = init_wh(h_root, br, au_do_nfsmnt(h_mnt), sb); ++ br->br_perm = old_perm; ++ br_wh_write_unlock(br); ++ ++ if (new) ++ i_unlock(h_dir); ++ else ++ hdir_unlock(h_dir, dir, bindex); ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * returns a newly allocated branch. @new_nbranch is a number of branches ++ * after adding a branch. ++ */ ++static struct aufs_branch *alloc_addbr(struct super_block *sb, int new_nbranch) ++{ ++ struct aufs_branch **branchp, *add_branch; ++ int sz; ++ void *p; ++ struct dentry *root; ++ struct inode *inode; ++ struct aufs_hinode *hinodep; ++ struct aufs_hdentry *hdentryp; ++ ++ LKTRTrace("new_nbranch %d\n", new_nbranch); ++ SiMustWriteLock(sb); ++ root = sb->s_root; ++ DiMustWriteLock(root); ++ inode = root->d_inode; ++ IiMustWriteLock(inode); ++ ++ add_branch = kmalloc(sizeof(*add_branch), GFP_KERNEL); ++ //if (LktrCond) {kfree(add_branch); add_branch = NULL;} ++ if (unlikely(!add_branch)) ++ goto out; ++ ++ sz = sizeof(*branchp) * (new_nbranch - 1); ++ if (unlikely(!sz)) ++ sz = sizeof(*branchp); ++ p = stosi(sb)->si_branch; ++ branchp = au_kzrealloc(p, sz, sizeof(*branchp) * new_nbranch, ++ GFP_KERNEL); ++ //if (LktrCond) branchp = NULL; ++ if (unlikely(!branchp)) ++ goto out; ++ stosi(sb)->si_branch = branchp; ++ ++ sz = sizeof(*hdentryp) * (new_nbranch - 1); ++ if (unlikely(!sz)) ++ sz = sizeof(*hdentryp); ++ p = dtodi(root)->di_hdentry; ++ hdentryp = au_kzrealloc(p, sz, sizeof(*hdentryp) * new_nbranch, ++ GFP_KERNEL); ++ //if (LktrCond) hdentryp = NULL; ++ if (unlikely(!hdentryp)) ++ goto out; ++ dtodi(root)->di_hdentry = hdentryp; ++ ++ sz = sizeof(*hinodep) * (new_nbranch - 1); ++ if (unlikely(!sz)) ++ sz = sizeof(*hinodep); ++ p = itoii(inode)->ii_hinode; ++ hinodep = au_kzrealloc(p, sz, sizeof(*hinodep) * new_nbranch, ++ GFP_KERNEL); ++ //if (LktrCond) hinodep = NULL; // unavailable test ++ if (unlikely(!hinodep)) ++ goto out; ++ itoii(inode)->ii_hinode = hinodep; ++ return add_branch; /* success */ ++ ++ out: ++ kfree(add_branch); ++ TraceErr(-ENOMEM); ++ return ERR_PTR(-ENOMEM); ++} ++ ++/* ++ * test if the branch permission is legal or not. ++ */ ++static int test_br(struct super_block *sb, struct inode *inode, int brperm, ++ char *path) ++{ ++ int err; ++ ++ err = 0; ++ if (unlikely(br_writable(brperm) && IS_RDONLY(inode))) { ++ Err("write permission for readonly fs or inode, %s\n", path); ++ err = -EINVAL; ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * retunrs,,, ++ * 0: success, the caller will add it ++ * plus: success, it is already unified, the caller should ignore it ++ * minus: error ++ */ ++static int test_add(struct super_block *sb, struct opt_add *add, int remount) ++{ ++ int err; ++ struct dentry *root; ++ struct inode *inode, *hidden_inode; ++ aufs_bindex_t bend, bindex; ++ ++ LKTRTrace("%s, remo%d\n", add->path, remount); ++ ++ root = sb->s_root; ++ if (unlikely(au_find_dbindex(root, add->nd.dentry) != -1)) { ++ err = 1; ++ if (!remount) { ++ err = -EINVAL; ++ Err("%s duplicated\n", add->path); ++ } ++ goto out; ++ } ++ ++ err = -ENOSPC; //-E2BIG; ++ bend = sbend(sb); ++ //if (LktrCond) bend = AUFS_BRANCH_MAX; ++ if (unlikely(AUFS_BRANCH_MAX <= add->bindex ++ || AUFS_BRANCH_MAX - 1 <= bend)) { ++ Err("number of branches exceeded %s\n", add->path); ++ goto out; ++ } ++ ++ err = -EDOM; ++ if (unlikely(add->bindex < 0 || bend + 1 < add->bindex)) { ++ Err("bad index %d\n", add->bindex); ++ goto out; ++ } ++ ++ inode = add->nd.dentry->d_inode; ++ DEBUG_ON(!inode || !S_ISDIR(inode->i_mode)); ++ err = -ENOENT; ++ if (unlikely(!inode->i_nlink)) { ++ Err("no existence %s\n", add->path); ++ goto out; ++ } ++ ++ err = -EINVAL; ++ if (unlikely(inode->i_sb == sb)) { ++ Err("%s must be outside\n", add->path); ++ goto out; ++ } ++ ++#if 1 //ndef CONFIG_AUFS_ROBR ++ if (unlikely(au_is_aufs(inode->i_sb) ++ || !strcmp(au_sbtype(inode->i_sb), "unionfs"))) { ++ Err("nested " AUFS_NAME " %s\n", add->path); ++ goto out; ++ } ++#endif ++ ++#ifdef AuNoNfsBranch ++ if (unlikely(au_is_nfs(inode->i_sb))) { ++ Err(AuNoNfsBranchMsg ". %s\n", add->path); ++ goto out; ++ } ++#endif ++ ++ err = test_br(sb, add->nd.dentry->d_inode, add->perm, add->path); ++ if (unlikely(err)) ++ goto out; ++ ++ if (unlikely(bend == -1)) ++ return 0; /* success */ ++ ++ hidden_inode = au_h_dptr(root)->d_inode; ++ if (unlikely(au_flag_test(sb, AuFlag_WARN_PERM) ++ && ((hidden_inode->i_mode & S_IALLUGO) ++ != (inode->i_mode & S_IALLUGO) ++ || hidden_inode->i_uid != inode->i_uid ++ || hidden_inode->i_gid != inode->i_gid))) ++ Warn("uid/gid/perm %s %u/%u/0%o, %u/%u/0%o\n", ++ add->path, ++ inode->i_uid, inode->i_gid, (inode->i_mode & S_IALLUGO), ++ hidden_inode->i_uid, hidden_inode->i_gid, ++ (hidden_inode->i_mode & S_IALLUGO)); ++ ++ err = -EINVAL; ++ for (bindex = 0; bindex <= bend; bindex++) ++ if (unlikely(is_overlap(sb, add->nd.dentry, ++ au_h_dptr_i(root, bindex)))) { ++ Err("%s is overlapped\n", add->path); ++ goto out; ++ } ++ err = 0; ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++int br_add(struct super_block *sb, struct opt_add *add, int remount) ++{ ++ int err, sz; ++ aufs_bindex_t bend, add_bindex; ++ struct dentry *root; ++ struct aufs_iinfo *iinfo; ++ struct aufs_sbinfo *sbinfo; ++ struct aufs_dinfo *dinfo; ++ struct inode *root_inode; ++ unsigned long long maxb; ++ struct aufs_branch **branchp, *add_branch; ++ struct aufs_hdentry *hdentryp; ++ struct aufs_hinode *hinodep; ++ ++ LKTRTrace("b%d, %s, 0x%x, %.*s\n", add->bindex, add->path, ++ add->perm, DLNPair(add->nd.dentry)); ++ SiMustWriteLock(sb); ++ root = sb->s_root; ++ DiMustWriteLock(root); ++ root_inode = root->d_inode; ++ IMustLock(root_inode); ++ IiMustWriteLock(root_inode); ++ ++ err = test_add(sb, add, remount); ++ if (unlikely(err < 0)) ++ goto out; ++ if (unlikely(err)) ++ return 0; /* success */ ++ ++ bend = sbend(sb); ++ add_branch = alloc_addbr(sb, bend + 2); ++ err = PTR_ERR(add_branch); ++ if (IS_ERR(add_branch)) ++ goto out; ++ ++ err = 0; ++ rw_init_nolock(&add_branch->br_wh_rwsem); ++ add_branch->br_wh = add_branch->br_plink = NULL; ++ if (unlikely(br_writable(add->perm))) { ++ err = init_br_wh(sb, /*bindex*/-1, add_branch, add->perm, ++ add->nd.dentry, add->nd.mnt); ++ if (unlikely(err)) { ++ kfree(add_branch); ++ goto out; ++ } ++ } ++ add_branch->br_xino = NULL; ++ add_branch->br_mnt = mntget(add->nd.mnt); ++ atomic_set(&add_branch->br_wh_running, 0); ++ add_branch->br_id = new_br_id(sb); ++ add_branch->br_perm = add->perm; ++ atomic_set(&add_branch->br_count, 0); ++ ++ sbinfo = stosi(sb); ++ dinfo = dtodi(root); ++ iinfo = itoii(root_inode); ++ ++ add_bindex = add->bindex; ++ sz = sizeof(*(sbinfo->si_branch)) * (bend + 1 - add_bindex); ++ branchp = sbinfo->si_branch + add_bindex; ++ memmove(branchp + 1, branchp, sz); ++ *branchp = add_branch; ++ sz = sizeof(*hdentryp) * (bend + 1 - add_bindex); ++ hdentryp = dinfo->di_hdentry + add_bindex; ++ memmove(hdentryp + 1, hdentryp, sz); ++ hdentryp->hd_dentry = NULL; ++ sz = sizeof(*hinodep) * (bend + 1 - add_bindex); ++ hinodep = iinfo->ii_hinode + add_bindex; ++ memmove(hinodep + 1, hinodep, sz); ++ hinodep->hi_inode = NULL; ++ hinodep->hi_notify = NULL; ++ ++ sbinfo->si_bend++; ++ dinfo->di_bend++; ++ iinfo->ii_bend++; ++ if (unlikely(bend == -1)) { ++ dinfo->di_bstart = 0; ++ iinfo->ii_bstart = 0; ++ } ++ set_h_dptr(root, add_bindex, dget(add->nd.dentry)); ++ set_h_iptr(root_inode, add_bindex, igrab(add->nd.dentry->d_inode), 0); ++ if (!add_bindex) ++ au_cpup_attr_all(root_inode); ++ else ++ au_add_nlink(root_inode, add->nd.dentry->d_inode); ++ maxb = add->nd.dentry->d_sb->s_maxbytes; ++ if (sb->s_maxbytes < maxb) ++ sb->s_maxbytes = maxb; ++ ++ if (au_flag_test(sb, AuFlag_XINO)) { ++ struct file *base_file = stobr(sb, 0)->br_xino; ++ if (!add_bindex) ++ base_file = stobr(sb, 1)->br_xino; ++ err = xino_init(sb, add_bindex, base_file, /*do_test*/1); ++ if (unlikely(err)) { ++ DEBUG_ON(add_branch->br_xino); ++ Err("ignored xino err %d, force noxino\n", err); ++ err = 0; ++ au_flag_clr(sb, AuFlag_XINO); ++ } ++ } ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * test if the branch is deletable or not. ++ */ ++static int test_children_busy(struct dentry *root, aufs_bindex_t bindex) ++{ ++ int err, i, j, sigen; ++ struct au_dcsub_pages dpages; ++ ++ LKTRTrace("b%d\n", bindex); ++ SiMustWriteLock(root->d_sb); ++ DiMustWriteLock(root); ++ ++ err = au_dpages_init(&dpages, GFP_KERNEL); ++ if (unlikely(err)) ++ goto out; ++ err = au_dcsub_pages(&dpages, root, NULL, NULL); ++ if (unlikely(err)) ++ goto out_dpages; ++ ++ sigen = au_sigen(root->d_sb); ++ DiMustNoWaiters(root); ++ IiMustNoWaiters(root->d_inode); ++ di_write_unlock(root); ++ for (i = 0; !err && i < dpages.ndpage; i++) { ++ struct au_dpage *dpage; ++ dpage = dpages.dpages + i; ++ for (j = 0; !err && j < dpage->ndentry; j++) { ++ struct dentry *d; ++ ++ d = dpage->dentries[j]; ++ if (au_digen(d) == sigen) ++ di_read_lock_child(d, AUFS_I_RLOCK); ++ else { ++ di_write_lock_child(d); ++ err = au_reval_dpath(d, sigen); ++ if (!err) ++ di_downgrade_lock(d, AUFS_I_RLOCK); ++ else { ++ di_write_unlock(d); ++ break; ++ } ++ } ++ ++ if (au_h_dptr_i(d, bindex) ++ && (!S_ISDIR(d->d_inode->i_mode) ++ || dbstart(d) == dbend(d))) ++ err = -EBUSY; ++ di_read_unlock(d, AUFS_I_RLOCK); ++ if (err) ++ LKTRTrace("%.*s\n", DLNPair(d)); ++ } ++ } ++ di_write_lock_child(root); /* aufs_write_lock() calls ..._child() */ ++ ++ out_dpages: ++ au_dpages_free(&dpages); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++int br_del(struct super_block *sb, struct opt_del *del, int remount) ++{ ++ int err, do_wh, rerr; ++ struct dentry *root; ++ struct inode *inode, *hidden_dir; ++ aufs_bindex_t bindex, bend, br_id; ++ struct aufs_sbinfo *sbinfo; ++ struct aufs_dinfo *dinfo; ++ struct aufs_iinfo *iinfo; ++ struct aufs_branch *br; ++ ++ LKTRTrace("%s, %.*s\n", del->path, DLNPair(del->h_root)); ++ SiMustWriteLock(sb); ++ root = sb->s_root; ++ DiMustWriteLock(root); ++ inode = root->d_inode; ++ IiMustWriteLock(inode); ++ ++ bindex = au_find_dbindex(root, del->h_root); ++ if (unlikely(bindex < 0)) { ++ if (remount) ++ return 0; /* success */ ++ err = -ENOENT; ++ Err("%s no such branch\n", del->path); ++ goto out; ++ } ++ LKTRTrace("bindex b%d\n", bindex); ++ ++ err = -EBUSY; ++ bend = sbend(sb); ++ br = stobr(sb, bindex); ++ if (unlikely(!bend || br_count(br))) { ++ LKTRTrace("bend %d, br_count %d\n", bend, br_count(br)); ++ goto out; ++ } ++ ++ do_wh = 0; ++ hidden_dir = del->h_root->d_inode; ++ if (unlikely(br->br_wh || br->br_plink)) { ++#if 0 ++ /* remove whiteout base */ ++ err = init_br_wh(sb, bindex, br, AuBr_RO, del->h_root, ++ br->br_mnt); ++ if (unlikely(err)) ++ goto out; ++#else ++ dput(br->br_wh); ++ dput(br->br_plink); ++ br->br_wh = br->br_plink = NULL; ++#endif ++ do_wh = 1; ++ } ++ ++ err = test_children_busy(root, bindex); ++ if (unlikely(err)) { ++ if (unlikely(do_wh)) ++ goto out_wh; ++ goto out; ++ } ++ ++ err = 0; ++ sbinfo = stosi(sb); ++ dinfo = dtodi(root); ++ iinfo = itoii(inode); ++ ++ dput(au_h_dptr_i(root, bindex)); ++ aufs_hiput(iinfo->ii_hinode + bindex); ++ br_id = br->br_id; ++ free_branch(br); ++ ++ //todo: realloc and shrink memeory ++ if (bindex < bend) { ++ const aufs_bindex_t n = bend - bindex; ++ struct aufs_branch **brp; ++ struct aufs_hdentry *hdp; ++ struct aufs_hinode *hip; ++ ++ brp = sbinfo->si_branch + bindex; ++ memmove(brp, brp + 1, sizeof(*brp) * n); ++ hdp = dinfo->di_hdentry + bindex; ++ memmove(hdp, hdp + 1, sizeof(*hdp) * n); ++ hip = iinfo->ii_hinode + bindex; ++ memmove(hip, hip + 1, sizeof(*hip) * n); ++ } ++ sbinfo->si_branch[0 + bend] = NULL; ++ dinfo->di_hdentry[0 + bend].hd_dentry = NULL; ++ iinfo->ii_hinode[0 + bend].hi_inode = NULL; ++ iinfo->ii_hinode[0 + bend].hi_notify = NULL; ++ ++ sbinfo->si_bend--; ++ dinfo->di_bend--; ++ iinfo->ii_bend--; ++ if (!bindex) ++ au_cpup_attr_all(inode); ++ else ++ au_sub_nlink(inode, del->h_root->d_inode); ++ if (au_flag_test(sb, AuFlag_PLINK)) ++ half_refresh_plink(sb, br_id); ++ ++ if (sb->s_maxbytes == del->h_root->d_sb->s_maxbytes) { ++ bend--; ++ sb->s_maxbytes = 0; ++ for (bindex = 0; bindex <= bend; bindex++) { ++ unsigned long long maxb; ++ maxb = sbr_sb(sb, bindex)->s_maxbytes; ++ if (sb->s_maxbytes < maxb) ++ sb->s_maxbytes = maxb; ++ } ++ } ++ goto out; /* success */ ++ ++ out_wh: ++ /* revert */ ++ rerr = init_br_wh(sb, bindex, br, br->br_perm, del->h_root, br->br_mnt); ++ if (rerr) ++ Warn("failed re-creating base whiteout, %s. (%d)\n", ++ del->path, rerr); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static int do_need_sigen_inc(int a, int b) ++{ ++ return (br_whable(a) && !br_whable(b)); ++} ++ ++static int need_sigen_inc(int old, int new) ++{ ++ return (do_need_sigen_inc(old, new) ++ || do_need_sigen_inc(new, old)); ++} ++ ++int br_mod(struct super_block *sb, struct opt_mod *mod, int remount, ++ int *do_update) ++{ ++ int err; ++ struct dentry *root; ++ aufs_bindex_t bindex; ++ struct aufs_branch *br; ++ struct inode *hidden_dir; ++ ++ LKTRTrace("%s, %.*s, 0x%x\n", ++ mod->path, DLNPair(mod->h_root), mod->perm); ++ SiMustWriteLock(sb); ++ root = sb->s_root; ++ DiMustWriteLock(root); ++ IiMustWriteLock(root->d_inode); ++ ++ bindex = au_find_dbindex(root, mod->h_root); ++ if (unlikely(bindex < 0)) { ++ if (remount) ++ return 0; /* success */ ++ err = -ENOENT; ++ Err("%s no such branch\n", mod->path); ++ goto out; ++ } ++ LKTRTrace("bindex b%d\n", bindex); ++ ++ hidden_dir = mod->h_root->d_inode; ++ err = test_br(sb, hidden_dir, mod->perm, mod->path); ++ if (unlikely(err)) ++ goto out; ++ ++ br = stobr(sb, bindex); ++ if (unlikely(br->br_perm == mod->perm)) ++ return 0; /* success */ ++ ++ if (br_writable(br->br_perm)) { ++#if 1 ++ /* remove whiteout base */ ++ //todo: mod->perm? ++ err = init_br_wh(sb, bindex, br, AuBr_RO, mod->h_root, ++ br->br_mnt); ++ if (unlikely(err)) ++ goto out; ++#else ++ dput(br->br_wh); ++ dput(br->br_plink); ++ br->br_wh = br->br_plink = NULL; ++#endif ++ ++ if (!br_writable(mod->perm)) { ++ /* rw --> ro, file might be mmapped */ ++ struct file *file, *hf; ++ ++#if 1 // test here ++ DiMustNoWaiters(root); ++ IiMustNoWaiters(root->d_inode); ++ di_write_unlock(root); ++ ++ // no need file_list_lock() since sbinfo is locked ++ //file_list_lock(); ++ list_for_each_entry(file, &sb->s_files, f_u.fu_list) { ++ LKTRTrace("%.*s\n", DLNPair(file->f_dentry)); ++ fi_read_lock(file); ++ if (!S_ISREG(file->f_dentry->d_inode->i_mode) ++ || !(file->f_mode & FMODE_WRITE) ++ || fbstart(file) != bindex) { ++ FiMustNoWaiters(file); ++ fi_read_unlock(file); ++ continue; ++ } ++ ++ // todo: already flushed? ++ hf = au_h_fptr(file); ++ hf->f_flags = au_file_roflags(hf->f_flags); ++ hf->f_mode &= ~FMODE_WRITE; ++ FiMustNoWaiters(file); ++ fi_read_unlock(file); ++ } ++ //file_list_unlock(); ++ ++ /* aufs_write_lock() calls ..._child() */ ++ di_write_lock_child(root); ++#endif ++ } ++ } ++ ++ *do_update |= need_sigen_inc(br->br_perm, mod->perm); ++ br->br_perm = mod->perm; ++ return err; /* success */ ++ ++ out: ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/branch.h b/fs/aufs/branch.h +new file mode 100755 +index 0000000..2557836 +--- /dev/null ++++ b/fs/aufs/branch.h +@@ -0,0 +1,235 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: branch.h,v 1.30 2007/05/14 03:41:51 sfjro Exp $ */ ++ ++#ifndef __AUFS_BRANCH_H__ ++#define __AUFS_BRANCH_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/mount.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++#include "misc.h" ++#include "super.h" ++ ++/* protected by superblock rwsem */ ++struct aufs_branch { ++ struct file *br_xino; ++ readf_t br_xino_read; ++ writef_t br_xino_write; ++ ++ aufs_bindex_t br_id; ++ ++ int br_perm; ++ struct vfsmount *br_mnt; ++ atomic_t br_count; ++ ++ /* whiteout base */ ++ struct aufs_rwsem br_wh_rwsem; ++ struct dentry *br_wh; ++ atomic_t br_wh_running; ++ ++ /* pseudo-link dir */ ++ struct dentry *br_plink; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* branch permission and attribute */ ++enum { ++ AuBr_RW, /* writable, linkable wh */ ++ AuBr_RO, /* readonly, no wh */ ++ AuBr_RR, /* natively readonly, no wh */ ++ ++ AuBr_RWNoLinkWH, /* un-linkable whiteouts */ ++ ++ AuBr_ROWH, ++ AuBr_RRWH, /* whiteout-able */ ++ ++ AuBr_Last ++}; ++ ++static inline int br_writable(int brperm) ++{ ++ return (brperm == AuBr_RW ++ || brperm == AuBr_RWNoLinkWH); ++} ++ ++static inline int br_whable(int brperm) ++{ ++ return (brperm == AuBr_RW ++ || brperm == AuBr_ROWH ++ || brperm == AuBr_RRWH); ++} ++ ++static inline int br_linkable_wh(int brperm) ++{ ++ return (brperm == AuBr_RW); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#define _AuNoNfsBranchMsg "NFS branch is not supported" ++#if LINUX_VERSION_CODE == KERNEL_VERSION(2,6,15) ++#define AuNoNfsBranch ++#define AuNoNfsBranchMsg _AuNoNfsBranchMsg ++#elif LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,19) \ ++ && !defined(CONFIG_AUFS_LHASH_PATCH) ++#define AuNoNfsBranch ++#define AuNoNfsBranchMsg _AuNoNfsBranchMsg \ ++ ", try lhash.patch and CONFIG_AUFS_LHASH_PATCH" ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct aufs_sbinfo; ++void free_branches(struct aufs_sbinfo *sinfo); ++int br_rdonly(struct aufs_branch *br); ++int find_brindex(struct super_block *sb, aufs_bindex_t br_id); ++int find_rw_br(struct super_block *sb, aufs_bindex_t bend); ++int find_rw_parent_br(struct dentry *dentry, aufs_bindex_t bend); ++struct opt_add; ++int br_add(struct super_block *sb, struct opt_add *add, int remount); ++struct opt_del; ++int br_del(struct super_block *sb, struct opt_del *del, int remount); ++struct opt_mod; ++int br_mod(struct super_block *sb, struct opt_mod *mod, int remount, ++ int *do_update); ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline int br_count(struct aufs_branch *br) ++{ ++ return atomic_read(&br->br_count); ++} ++ ++static inline void br_get(struct aufs_branch *br) ++{ ++ atomic_inc(&br->br_count); ++} ++ ++static inline void br_put(struct aufs_branch *br) ++{ ++ atomic_dec(&br->br_count); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* Superblock to branch */ ++static inline aufs_bindex_t sbr_id(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return stobr(sb, bindex)->br_id; ++} ++ ++static inline ++struct vfsmount *sbr_mnt(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return stobr(sb, bindex)->br_mnt; ++} ++ ++static inline ++struct super_block *sbr_sb(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return sbr_mnt(sb, bindex)->mnt_sb; ++} ++ ++#if 0 ++static inline int sbr_count(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return br_count(stobr(sb, bindex)); ++} ++ ++static inline void sbr_get(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ br_get(stobr(sb, bindex)); ++} ++#endif ++ ++static inline void sbr_put(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ br_put(stobr(sb, bindex)); ++} ++ ++static inline int sbr_perm(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return stobr(sb, bindex)->br_perm; ++} ++ ++static inline int sbr_is_whable(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return br_whable(sbr_perm(sb, bindex)); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_LHASH_PATCH ++static inline struct vfsmount *au_do_nfsmnt(struct vfsmount *h_mnt) ++{ ++ if (!au_is_nfs(h_mnt->mnt_sb)) ++ return NULL; ++ return h_mnt; ++} ++ ++/* it doesn't mntget() */ ++static inline ++struct vfsmount *au_nfsmnt(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return au_do_nfsmnt(sbr_mnt(sb, bindex)); ++} ++#else ++static inline struct vfsmount *au_do_nfsmnt(struct vfsmount *h_mnt) ++{ ++ return NULL; ++} ++ ++static inline ++struct vfsmount *au_nfsmnt(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ return NULL; ++} ++#endif /* CONFIG_AUFS_LHASH_PATCH */ ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * br_wh_read_lock, br_wh_write_lock ++ * br_wh_read_unlock, br_wh_write_unlock, br_wh_downgrade_lock ++ */ ++SimpleRwsemFuncs(br_wh, struct aufs_branch *br, br->br_wh_rwsem); ++ ++/* to debug easier, do not make them inlined functions */ ++#define BrWhMustReadLock(br) do { \ ++ /* SiMustAnyLock(sb); */ \ ++ RwMustReadLock(&(br)->br_wh_rwsem); \ ++} while (0) ++ ++#define BrWhMustWriteLock(br) do { \ ++ /* SiMustAnyLock(sb); */ \ ++ RwMustWriteLock(&(br)->br_wh_rwsem); \ ++} while (0) ++ ++#define BrWhMustAnyLock(br) do { \ ++ /* SiMustAnyLock(sb); */ \ ++ RwMustAnyLock(&(br)->br_wh_rwsem); \ ++} while (0) ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_BRANCH_H__ */ +diff --git a/fs/aufs/cpup.c b/fs/aufs/cpup.c +new file mode 100755 +index 0000000..6636f40 +--- /dev/null ++++ b/fs/aufs/cpup.c +@@ -0,0 +1,773 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: cpup.c,v 1.37 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#include <asm/uaccess.h> ++#include "aufs.h" ++ ++/* violent cpup_attr_*() functions don't care inode lock */ ++void au_cpup_attr_timesizes(struct inode *inode) ++{ ++ struct inode *hidden_inode; ++ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ //IMustLock(inode); ++ hidden_inode = au_h_iptr(inode); ++ DEBUG_ON(!hidden_inode); ++ //IMustLock(!hidden_inode); ++ ++ inode->i_atime = hidden_inode->i_atime; ++ inode->i_mtime = hidden_inode->i_mtime; ++ inode->i_ctime = hidden_inode->i_ctime; ++ spin_lock(&inode->i_lock); ++ i_size_write(inode, i_size_read(hidden_inode)); ++ inode->i_blocks = hidden_inode->i_blocks; ++ spin_unlock(&inode->i_lock); ++} ++ ++void au_cpup_attr_nlink(struct inode *inode) ++{ ++ struct inode *h_inode; ++ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ //IMustLock(inode); ++ DEBUG_ON(!inode->i_mode); ++ ++ h_inode = au_h_iptr(inode); ++ inode->i_nlink = h_inode->i_nlink; ++ ++ /* ++ * fewer nlink makes find(1) noisy, but larger nlink doesn't. ++ * it may includes whplink directory. ++ */ ++ if (unlikely(S_ISDIR(h_inode->i_mode))) { ++ aufs_bindex_t bindex, bend; ++ bend = ibend(inode); ++ for (bindex = ibstart(inode) + 1; bindex <= bend; bindex++) { ++ h_inode = au_h_iptr_i(inode, bindex); ++ if (h_inode) ++ au_add_nlink(inode, h_inode); ++ } ++ } ++} ++ ++void au_cpup_attr_changable(struct inode *inode) ++{ ++ struct inode *hidden_inode; ++ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ //IMustLock(inode); ++ hidden_inode = au_h_iptr(inode); ++ DEBUG_ON(!hidden_inode); ++ ++ inode->i_mode = hidden_inode->i_mode; ++ inode->i_uid = hidden_inode->i_uid; ++ inode->i_gid = hidden_inode->i_gid; ++ au_cpup_attr_timesizes(inode); ++ ++ //?? ++ inode->i_flags = hidden_inode->i_flags; ++} ++ ++void au_cpup_igen(struct inode *inode, struct inode *h_inode) ++{ ++ inode->i_generation = h_inode->i_generation; ++ itoii(inode)->ii_hsb1 = h_inode->i_sb; ++} ++ ++void au_cpup_attr_all(struct inode *inode) ++{ ++ struct inode *hidden_inode; ++ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ //IMustLock(inode); ++ hidden_inode = au_h_iptr(inode); ++ DEBUG_ON(!hidden_inode); ++ ++ au_cpup_attr_changable(inode); ++ if (inode->i_nlink > 0) ++ au_cpup_attr_nlink(inode); ++ ++ switch (inode->i_mode & S_IFMT) { ++ case S_IFBLK: ++ case S_IFCHR: ++ inode->i_rdev = hidden_inode->i_rdev; ++ } ++ inode->i_blkbits = hidden_inode->i_blkbits; ++ au_cpup_attr_blksize(inode, hidden_inode); ++ au_cpup_igen(inode, hidden_inode); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* Note: dt_dentry and dt_hidden_dentry are not dget/dput-ed */ ++ ++/* keep the timestamps of the parent dir when cpup */ ++void dtime_store(struct dtime *dt, struct dentry *dentry, ++ struct dentry *hidden_dentry) ++{ ++ struct inode *inode; ++ ++ TraceEnter(); ++ DEBUG_ON(!dentry || !hidden_dentry || !hidden_dentry->d_inode); ++ ++ dt->dt_dentry = dentry; ++ dt->dt_h_dentry = hidden_dentry; ++ inode = hidden_dentry->d_inode; ++ dt->dt_atime = inode->i_atime; ++ dt->dt_mtime = inode->i_mtime; ++ //smp_mb(); ++} ++ ++// todo: remove extra parameter ++void dtime_revert(struct dtime *dt, int h_parent_is_locked) ++{ ++ struct iattr attr; ++ int err; ++ struct dentry *dentry; ++ ++ LKTRTrace("h_parent locked %d\n", h_parent_is_locked); ++ ++ attr.ia_atime = dt->dt_atime; ++ attr.ia_mtime = dt->dt_mtime; ++ attr.ia_valid = ATTR_FORCE | ATTR_MTIME | ATTR_MTIME_SET ++ | ATTR_ATIME | ATTR_ATIME_SET; ++ //smp_mb(); ++ dentry = NULL; ++ if (!h_parent_is_locked /* && !IS_ROOT(dt->dt_dentry) */) ++ dentry = dt->dt_dentry; ++ err = vfsub_notify_change(dt->dt_h_dentry, &attr, ++ need_dlgt(dt->dt_dentry->d_sb)); ++ if (unlikely(err)) ++ Warn("restoring timestamps failed(%d). ignored\n", err); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int cpup_iattr(struct dentry *hidden_dst, struct dentry *hidden_src, ++ int dlgt) ++{ ++ int err; ++ struct iattr ia; ++ struct inode *hidden_isrc, *hidden_idst; ++ ++ LKTRTrace("%.*s\n", DLNPair(hidden_dst)); ++ hidden_idst = hidden_dst->d_inode; ++ //IMustLock(hidden_idst); ++ hidden_isrc = hidden_src->d_inode; ++ //IMustLock(hidden_isrc); ++ ++ ia.ia_valid = ATTR_FORCE | ATTR_MODE | ATTR_UID | ATTR_GID ++ | ATTR_ATIME | ATTR_MTIME ++ | ATTR_ATIME_SET | ATTR_MTIME_SET; ++ ia.ia_mode = hidden_isrc->i_mode; ++ ia.ia_uid = hidden_isrc->i_uid; ++ ia.ia_gid = hidden_isrc->i_gid; ++ ia.ia_atime = hidden_isrc->i_atime; ++ ia.ia_mtime = hidden_isrc->i_mtime; ++ err = vfsub_notify_change(hidden_dst, &ia, dlgt); ++ //if (LktrCond) err = -1; ++ if (!err) ++ hidden_idst->i_flags = hidden_isrc->i_flags; //?? ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * to support a sparse file which is opened with O_APPEND, ++ * we need to close the file. ++ */ ++static int cpup_regular(struct dentry *dentry, aufs_bindex_t bdst, ++ aufs_bindex_t bsrc, loff_t len) ++{ ++ int err, i, sparse; ++ struct super_block *sb; ++ struct inode *hidden_inode; ++ enum {SRC, DST}; ++ struct { ++ aufs_bindex_t bindex; ++ unsigned int flags; ++ struct dentry *dentry; ++ struct file *file; ++ void *label, *label_file; ++ } *h, hidden[] = { ++ { ++ .bindex = bsrc, ++ .flags = O_RDONLY | O_NOATIME | O_LARGEFILE, ++ .file = NULL, ++ .label = &&out, ++ .label_file = &&out_src_file ++ }, ++ { ++ .bindex = bdst, ++ .flags = O_WRONLY | O_NOATIME | O_LARGEFILE, ++ .file = NULL, ++ .label = &&out_src_file, ++ .label_file = &&out_dst_file ++ } ++ }; ++ ++ LKTRTrace("dentry %.*s, bdst %d, bsrc %d, len %lld\n", ++ DLNPair(dentry), bdst, bsrc, len); ++ DEBUG_ON(bsrc <= bdst); ++ DEBUG_ON(!len); ++ sb = dentry->d_sb; ++ DEBUG_ON(test_ro(sb, bdst, dentry->d_inode)); ++ // bsrc branch can be ro/rw. ++ ++ h = hidden; ++ for (i = 0; i < 2; i++, h++) { ++ h->dentry = au_h_dptr_i(dentry, h->bindex); ++ DEBUG_ON(!h->dentry); ++ hidden_inode = h->dentry->d_inode; ++ DEBUG_ON(!hidden_inode || !S_ISREG(hidden_inode->i_mode)); ++ h->file = hidden_open(dentry, h->bindex, h->flags); ++ //if (LktrCond) ++ //{fput(h->file); sbr_put(sb, h->bindex); h->file = ERR_PTR(-1);} ++ err = PTR_ERR(h->file); ++ if (IS_ERR(h->file)) ++ goto *h->label; ++ err = -EINVAL; ++ if (unlikely(!h->file->f_op)) ++ goto *h->label_file; ++ } ++ ++ /* stop updating while we copyup */ ++ IMustLock(hidden[SRC].dentry->d_inode); ++ sparse = 0; ++ err = au_copy_file(hidden[DST].file, hidden[SRC].file, len, sb, ++ &sparse); ++ ++ /* sparse file: update i_blocks next time */ ++ if (unlikely(!err && sparse)) ++ d_drop(dentry); ++ ++ out_dst_file: ++ fput(hidden[DST].file); ++ sbr_put(sb, hidden[DST].bindex); ++ out_src_file: ++ fput(hidden[SRC].file); ++ sbr_put(sb, hidden[SRC].bindex); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++// unnecessary? ++unsigned int au_flags_cpup(unsigned int init, struct dentry *parent) ++{ ++ if (unlikely(parent && IS_ROOT(parent))) ++ init |= CPUP_LOCKED_GHDIR; ++ return init; ++} ++ ++/* return with hidden dst inode is locked */ ++static int cpup_entry(struct dentry *dentry, aufs_bindex_t bdst, ++ aufs_bindex_t bsrc, loff_t len, unsigned int flags, ++ int dlgt) ++{ ++ int err, isdir, symlen; ++ struct dentry *hidden_src, *hidden_dst, *hidden_parent, *parent; ++ struct inode *hidden_inode, *hidden_dir, *dir; ++ struct dtime dt; ++ umode_t mode; ++ char *sym; ++ mm_segment_t old_fs; ++ const int do_dt = flags & CPUP_DTIME; ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s, i%lu, bdst %d, bsrc %d, len %Ld, flags 0x%x\n", ++ DLNPair(dentry), dentry->d_inode->i_ino, bdst, bsrc, len, ++ flags); ++ sb = dentry->d_sb; ++ DEBUG_ON(bdst >= bsrc || test_ro(sb, bdst, NULL)); ++ // bsrc branch can be ro/rw. ++ ++ hidden_src = au_h_dptr_i(dentry, bsrc); ++ DEBUG_ON(!hidden_src); ++ hidden_inode = hidden_src->d_inode; ++ DEBUG_ON(!hidden_inode); ++ ++ /* stop refrencing while we are creating */ ++ //parent = dget_parent(dentry); ++ parent = dentry->d_parent; ++ dir = parent->d_inode; ++ hidden_dst = au_h_dptr_i(dentry, bdst); ++ DEBUG_ON(hidden_dst && hidden_dst->d_inode); ++ //hidden_parent = dget_parent(hidden_dst); ++ hidden_parent = hidden_dst->d_parent; ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ ++ if (do_dt) ++ dtime_store(&dt, parent, hidden_parent); ++ ++ isdir = 0; ++ mode = hidden_inode->i_mode; ++ switch (mode & S_IFMT) { ++ case S_IFREG: ++ /* stop updating while we are referencing */ ++ IMustLock(hidden_inode); ++ err = vfsub_create(hidden_dir, hidden_dst, mode | S_IWUSR, NULL, ++ dlgt); ++ //if (LktrCond) {vfs_unlink(hidden_dir, hidden_dst); err = -1;} ++ if (!err) { ++ loff_t l = i_size_read(hidden_inode); ++ if (len == -1 || l < len) ++ len = l; ++ if (len) { ++ err = cpup_regular(dentry, bdst, bsrc, len); ++ //if (LktrCond) err = -1; ++ } ++ if (unlikely(err)) { ++ int rerr; ++ rerr = vfsub_unlink(hidden_dir, hidden_dst, ++ dlgt); ++ if (rerr) { ++ IOErr("failed unlinking cpup-ed %.*s" ++ "(%d, %d)\n", ++ DLNPair(hidden_dst), err, rerr); ++ err = -EIO; ++ } ++ } ++ } ++ break; ++ case S_IFDIR: ++ isdir = 1; ++ err = vfsub_mkdir(hidden_dir, hidden_dst, mode, dlgt); ++ //if (LktrCond) {vfs_rmdir(hidden_dir, hidden_dst); err = -1;} ++ if (!err) { ++ /* setattr case: dir is not locked */ ++ if (0 && ibstart(dir) == bdst) ++ au_cpup_attr_nlink(dir); ++ au_cpup_attr_nlink(dentry->d_inode); ++ } ++ break; ++ case S_IFLNK: ++ err = -ENOMEM; ++ sym = __getname(); ++ //if (LktrCond) {__putname(sym); sym = NULL;} ++ if (unlikely(!sym)) ++ break; ++ old_fs = get_fs(); ++ set_fs(KERNEL_DS); ++ err = symlen = hidden_inode->i_op->readlink ++ (hidden_src, (char __user*)sym, PATH_MAX); ++ //if (LktrCond) err = symlen = -1; ++ set_fs(old_fs); ++ if (symlen > 0) { ++ sym[symlen] = 0; ++ err = vfsub_symlink(hidden_dir, hidden_dst, sym, mode, ++ dlgt); ++ //if (LktrCond) ++ //{vfs_unlink(hidden_dir, hidden_dst); err = -1;} ++ } ++ __putname(sym); ++ break; ++ case S_IFCHR: ++ case S_IFBLK: ++ DEBUG_ON(!capable(CAP_MKNOD)); ++ /*FALLTHROUGH*/ ++ case S_IFIFO: ++ case S_IFSOCK: ++ err = vfsub_mknod(hidden_dir, hidden_dst, mode, ++ hidden_inode->i_rdev, dlgt); ++ //if (LktrCond) {vfs_unlink(hidden_dir, hidden_dst); err = -1;} ++ break; ++ default: ++ IOErr("Unknown inode type 0%o\n", mode); ++ err = -EIO; ++ } ++ ++ if (do_dt) ++ dtime_revert(&dt, flags & CPUP_LOCKED_GHDIR); ++ //dput(parent); ++ //dput(hidden_parent); ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * copyup the @dentry from @bsrc to @bdst. ++ * the caller must set the both of hidden dentries. ++ * @len is for trucating when it is -1 copyup the entire file. ++ */ ++int cpup_single(struct dentry *dentry, aufs_bindex_t bdst, aufs_bindex_t bsrc, ++ loff_t len, unsigned int flags) ++{ ++ int err, rerr, isdir, dlgt; ++ struct dentry *hidden_src, *hidden_dst, *parent;//, *h_parent; ++ struct inode *dst_inode, *hidden_dir, *inode, *src_inode; ++ struct super_block *sb; ++ aufs_bindex_t old_ibstart; ++ struct dtime dt; ++ ++ LKTRTrace("%.*s, i%lu, bdst %d, bsrc %d, len %Ld, flags 0x%x\n", ++ DLNPair(dentry), dentry->d_inode->i_ino, bdst, bsrc, len, ++ flags); ++ sb = dentry->d_sb; ++ DEBUG_ON(bsrc <= bdst); ++ hidden_dst = au_h_dptr_i(dentry, bdst); ++ DEBUG_ON(!hidden_dst || hidden_dst->d_inode); ++ //h_parent = dget_parent(hidden_dst); ++ //hidden_dir = h_parent->d_inode; ++ hidden_dir = hidden_dst->d_parent->d_inode; ++ IMustLock(hidden_dir); ++ hidden_src = au_h_dptr_i(dentry, bsrc); ++ DEBUG_ON(!hidden_src || !hidden_src->d_inode); ++ inode = dentry->d_inode; ++ IiMustWriteLock(inode); ++ ++ dlgt = need_dlgt(sb); ++ dst_inode = au_h_iptr_i(inode, bdst); ++ if (unlikely(dst_inode)) { ++ if (unlikely(!au_flag_test(sb, AuFlag_PLINK))) { ++ err = -EIO; ++ IOErr("i%lu exists on a upper branch " ++ "but plink is disabled\n", inode->i_ino); ++ goto out; ++ } ++ ++ if (dst_inode->i_nlink) { ++ hidden_src = lkup_plink(sb, bdst, inode); ++ err = PTR_ERR(hidden_src); ++ if (IS_ERR(hidden_src)) ++ goto out; ++ DEBUG_ON(!hidden_src->d_inode); ++ // vfs_link() does lock the inode ++ err = vfsub_link(hidden_src, hidden_dir, hidden_dst, dlgt); ++ dput(hidden_src); ++ goto out; ++ } else ++ /* udba work */ ++ au_update_brange(inode, 1); ++ } ++ ++ old_ibstart = ibstart(inode); ++ err = cpup_entry(dentry, bdst, bsrc, len, flags, dlgt); ++ if (unlikely(err)) ++ goto out; ++ dst_inode = hidden_dst->d_inode; ++ hi_lock_child2(dst_inode); ++ ++ //todo: test dlgt ++ err = cpup_iattr(hidden_dst, hidden_src, dlgt); ++ //if (LktrCond) err = -1; ++#if 0 // xattr ++ if (0 && !err) ++ err = cpup_xattrs(hidden_src, hidden_dst); ++#endif ++ isdir = S_ISDIR(dst_inode->i_mode); ++ if (!err) { ++ if (bdst < old_ibstart) ++ set_ibstart(inode, bdst); ++ set_h_iptr(inode, bdst, igrab(dst_inode), ++ au_hi_flags(inode, isdir)); ++ i_unlock(dst_inode); ++ src_inode = hidden_src->d_inode; ++ if (!isdir) { ++ if (src_inode->i_nlink > 1 ++ && au_flag_test(sb, AuFlag_PLINK)) ++ append_plink(sb, inode, hidden_dst, bdst); ++ else { ++ /* braces are added to stop a warning */ ++ ;//xino_write0(sb, bsrc, src_inode->i_ino); ++ /* ignore this error */ ++ } ++ } ++ //goto out; /* success */ ++ return 0; /* success */ ++ } ++ ++ /* revert */ ++ i_unlock(dst_inode); ++ parent = dget_parent(dentry); ++ //dtime_store(&dt, parent, h_parent); ++ dtime_store(&dt, parent, hidden_dst->d_parent); ++ dput(parent); ++ if (!isdir) ++ rerr = vfsub_unlink(hidden_dir, hidden_dst, dlgt); ++ else ++ rerr = vfsub_rmdir(hidden_dir, hidden_dst, dlgt); ++ //rerr = -1; ++ dtime_revert(&dt, flags & CPUP_LOCKED_GHDIR); ++ if (rerr) { ++ IOErr("failed removing broken entry(%d, %d)\n", err, rerr); ++ err = -EIO; ++ } ++ ++ out: ++ //dput(h_parent); ++ TraceErr(err); ++ return err; ++} ++ ++struct cpup_single_args { ++ int *errp; ++ struct dentry *dentry; ++ aufs_bindex_t bdst, bsrc; ++ loff_t len; ++ unsigned int flags; ++}; ++ ++static void call_cpup_single(void *args) ++{ ++ struct cpup_single_args *a = args; ++ *a->errp = cpup_single(a->dentry, a->bdst, a->bsrc, a->len, a->flags); ++} ++ ++int sio_cpup_single(struct dentry *dentry, aufs_bindex_t bdst, ++ aufs_bindex_t bsrc, loff_t len, unsigned int flags) ++{ ++ int err; ++ struct dentry *hidden_dentry; ++ umode_t mode; ++ ++ LKTRTrace("%.*s, i%lu, bdst %d, bsrc %d, len %Ld, flags 0x%x\n", ++ DLNPair(dentry), dentry->d_inode->i_ino, bdst, bsrc, len, ++ flags); ++ ++ hidden_dentry = au_h_dptr_i(dentry, bsrc); ++ mode = hidden_dentry->d_inode->i_mode & S_IFMT; ++ if ((mode != S_IFCHR && mode != S_IFBLK) ++ || capable(CAP_MKNOD)) ++ err = cpup_single(dentry, bdst, bsrc, len, flags); ++ else { ++ struct cpup_single_args args = { ++ .errp = &err, ++ .dentry = dentry, ++ .bdst = bdst, ++ .bsrc = bsrc, ++ .len = len, ++ .flags = flags ++ }; ++ au_wkq_wait(call_cpup_single, &args, /*dlgt*/0); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * copyup the @dentry from the first active hidden branch to @bdst, ++ * using cpup_single(). ++ */ ++int cpup_simple(struct dentry *dentry, aufs_bindex_t bdst, loff_t len, ++ unsigned int flags) ++{ ++ int err; ++ struct inode *inode; ++ aufs_bindex_t bsrc, bend; ++ ++ LKTRTrace("%.*s, bdst %d, len %Ld, flags 0x%x\n", ++ DLNPair(dentry), bdst, len, flags); ++ inode = dentry->d_inode; ++ DEBUG_ON(!S_ISDIR(inode->i_mode) && dbstart(dentry) < bdst); ++ ++ bend = dbend(dentry); ++ for (bsrc = bdst + 1; bsrc <= bend; bsrc++) ++ if (au_h_dptr_i(dentry, bsrc)) ++ break; ++ DEBUG_ON(!au_h_dptr_i(dentry, bsrc)); ++ ++ err = lkup_neg(dentry, bdst); ++ //err = -1; ++ if (!err) { ++ err = cpup_single(dentry, bdst, bsrc, len, flags); ++ if (!err) ++ return 0; /* success */ ++ ++ /* revert */ ++ set_h_dptr(dentry, bdst, NULL); ++ set_dbstart(dentry, bsrc); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++struct cpup_simple_args { ++ int *errp; ++ struct dentry *dentry; ++ aufs_bindex_t bdst; ++ loff_t len; ++ unsigned int flags; ++}; ++ ++static void call_cpup_simple(void *args) ++{ ++ struct cpup_simple_args *a = args; ++ *a->errp = cpup_simple(a->dentry, a->bdst, a->len, a->flags); ++} ++ ++int sio_cpup_simple(struct dentry *dentry, aufs_bindex_t bdst, loff_t len, ++ unsigned int flags) ++{ ++ int err, do_sio, dlgt; ++ //struct dentry *parent; ++ struct inode *hidden_dir, *dir; ++ ++ LKTRTrace("%.*s, b%d, len %Ld, flags 0x%x\n", ++ DLNPair(dentry), bdst, len, flags); ++ ++ //parent = dget_parent(dentry); ++ //dir = parent->d_inode; ++ dir = dentry->d_parent->d_inode; ++ hidden_dir = au_h_iptr_i(dir, bdst); ++ dlgt = need_dlgt(dir->i_sb); ++ do_sio = au_test_perm(hidden_dir, MAY_EXEC | MAY_WRITE, dlgt); ++ if (!do_sio) { ++ umode_t mode = dentry->d_inode->i_mode & S_IFMT; ++ do_sio = ((mode == S_IFCHR || mode == S_IFBLK) ++ && !capable(CAP_MKNOD)); ++ } ++ if (!do_sio) ++ err = cpup_simple(dentry, bdst, len, flags); ++ else { ++ struct cpup_simple_args args = { ++ .errp = &err, ++ .dentry = dentry, ++ .bdst = bdst, ++ .len = len, ++ .flags = flags ++ }; ++ au_wkq_wait(call_cpup_simple, &args, /*dlgt*/0); ++ } ++ ++ //dput(parent); ++ TraceErr(err); ++ return err; ++} ++ ++//todo: dcsub ++/* cf. revalidate function in file.c */ ++int cpup_dirs(struct dentry *dentry, aufs_bindex_t bdst, struct dentry *locked) ++{ ++ int err; ++ struct super_block *sb; ++ struct dentry *d, *parent, *hidden_parent; ++ unsigned int udba; ++ ++ LKTRTrace("%.*s, b%d, parent i%lu, locked %p\n", ++ DLNPair(dentry), bdst, parent_ino(dentry), locked); ++ sb = dentry->d_sb; ++ DEBUG_ON(test_ro(sb, bdst, NULL)); ++ parent = dentry->d_parent; ++ IiMustWriteLock(parent->d_inode); ++ if (unlikely(IS_ROOT(parent))) ++ return 0; ++ if (locked) { ++ DiMustAnyLock(locked); ++ IiMustAnyLock(locked->d_inode); ++ } ++ ++ /* slow loop, keep it simple and stupid */ ++ err = 0; ++ udba = au_flag_test(sb, AuFlag_UDBA_INOTIFY); ++ while (1) { ++ parent = dentry->d_parent; // dget_parent() ++ hidden_parent = au_h_dptr_i(parent, bdst); ++ if (hidden_parent) ++ return 0; /* success */ ++ ++ /* find top dir which is needed to cpup */ ++ do { ++ d = parent; ++ parent = d->d_parent; // dget_parent() ++ if (parent != locked) ++ di_read_lock_parent3(parent, !AUFS_I_RLOCK); ++ hidden_parent = au_h_dptr_i(parent, bdst); ++ if (parent != locked) ++ di_read_unlock(parent, !AUFS_I_RLOCK); ++ } while (!hidden_parent); ++ ++ if (d != dentry->d_parent) ++ di_write_lock_child3(d); ++ ++ /* somebody else might create while we were sleeping */ ++ if (!au_h_dptr_i(d, bdst) || !au_h_dptr_i(d, bdst)->d_inode) { ++ struct inode *h_dir = hidden_parent->d_inode, ++ *dir = parent->d_inode, ++ *h_gdir, *gdir; ++ ++ if (au_h_dptr_i(d, bdst)) ++ au_update_dbstart(d); ++ //DEBUG_ON(dbstart(d) <= bdst); ++ if (parent != locked) ++ di_read_lock_parent3(parent, AUFS_I_RLOCK); ++ h_gdir = gdir = NULL; ++ if (unlikely(udba && !IS_ROOT(parent))) { ++ gdir = parent->d_parent->d_inode; ++ h_gdir = hidden_parent->d_parent->d_inode; ++ hgdir_lock(h_gdir, gdir, bdst); ++ } ++ hdir_lock(h_dir, dir, bdst); ++ err = sio_cpup_simple(d, bdst, -1, ++ au_flags_cpup(CPUP_DTIME, ++ parent)); ++ //if (LktrCond) err = -1; ++ hdir_unlock(h_dir, dir, bdst); ++ if (unlikely(gdir)) ++ hdir_unlock(h_gdir, gdir, bdst); ++ if (parent != locked) ++ di_read_unlock(parent, AUFS_I_RLOCK); ++ } ++ ++ if (d != dentry->d_parent) ++ di_write_unlock(d); ++ if (unlikely(err)) ++ break; ++ } ++ ++// out: ++ TraceErr(err); ++ return err; ++} ++ ++int test_and_cpup_dirs(struct dentry *dentry, aufs_bindex_t bdst, ++ struct dentry *locked) ++{ ++ int err; ++ struct dentry *parent; ++ struct inode *dir; ++ ++ parent = dentry->d_parent; ++ dir = parent->d_inode; ++ LKTRTrace("%.*s, b%d, parent i%lu, locked %p\n", ++ DLNPair(dentry), bdst, dir->i_ino, locked); ++ DiMustReadLock(parent); ++ IiMustReadLock(dir); ++ ++ if (au_h_iptr_i(dir, bdst)) ++ return 0; ++ ++ err = 0; ++ di_read_unlock(parent, AUFS_I_RLOCK); ++ di_write_lock_parent(parent); ++ if (au_h_iptr_i(dir, bdst)) ++ goto out; ++ ++ err = cpup_dirs(dentry, bdst, locked); ++ ++ out: ++ di_downgrade_lock(parent, AUFS_I_RLOCK); ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/cpup.h b/fs/aufs/cpup.h +new file mode 100755 +index 0000000..86557aa +--- /dev/null ++++ b/fs/aufs/cpup.h +@@ -0,0 +1,72 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: cpup.h,v 1.15 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_CPUP_H__ ++#define __AUFS_CPUP_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++ ++static inline ++void au_cpup_attr_blksize(struct inode *inode, struct inode *h_inode) ++{ ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,19) ++ inode->i_blksize = h_inode->i_blksize; ++#endif ++} ++ ++void au_cpup_attr_timesizes(struct inode *inode); ++void au_cpup_attr_nlink(struct inode *inode); ++void au_cpup_attr_changable(struct inode *inode); ++void au_cpup_igen(struct inode *inode, struct inode *h_inode); ++void au_cpup_attr_all(struct inode *inode); ++ ++#define CPUP_DTIME 1 // do dtime_store/revert ++// todo: remove this ++#define CPUP_LOCKED_GHDIR 2 // grand parent hidden dir is locked ++unsigned int au_flags_cpup(unsigned int init, struct dentry *parent); ++ ++int cpup_single(struct dentry *dentry, aufs_bindex_t bdst, aufs_bindex_t bsrc, ++ loff_t len, unsigned int flags); ++int sio_cpup_single(struct dentry *dentry, aufs_bindex_t bdst, ++ aufs_bindex_t bsrc, loff_t len, unsigned int flags); ++int cpup_simple(struct dentry *dentry, aufs_bindex_t bdst, loff_t len, ++ unsigned int flags); ++int sio_cpup_simple(struct dentry *dentry, aufs_bindex_t bdst, loff_t len, ++ unsigned int flags); ++ ++int cpup_dirs(struct dentry *dentry, aufs_bindex_t bdst, struct dentry *locked); ++int test_and_cpup_dirs(struct dentry *dentry, aufs_bindex_t bdst, ++ struct dentry *locked); ++ ++/* keep timestamps when copyup */ ++struct dtime { ++ struct dentry *dt_dentry, *dt_h_dentry; ++ struct timespec dt_atime, dt_mtime; ++}; ++void dtime_store(struct dtime *dt, struct dentry *dentry, ++ struct dentry *h_dentry); ++void dtime_revert(struct dtime *dt, int h_parent_is_locked); ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_CPUP_H__ */ +diff --git a/fs/aufs/dcsub.c b/fs/aufs/dcsub.c +new file mode 100755 +index 0000000..6ec29d3 +--- /dev/null ++++ b/fs/aufs/dcsub.c +@@ -0,0 +1,175 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: dcsub.c,v 1.3 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++static void au_dpage_free(struct au_dpage *dpage) ++{ ++ int i; ++ ++ TraceEnter(); ++ DEBUG_ON(!dpage); ++ ++ for (i = 0; i < dpage->ndentry; i++) ++ dput(dpage->dentries[i]); ++ free_page((unsigned long)dpage->dentries); ++} ++ ++int au_dpages_init(struct au_dcsub_pages *dpages, gfp_t gfp) ++{ ++ int err; ++ void *p; ++ ++ TraceEnter(); ++ ++ err = -ENOMEM; ++ dpages->dpages = kmalloc(sizeof(*dpages->dpages), gfp); ++ if (unlikely(!dpages->dpages)) ++ goto out; ++ p = (void*)__get_free_page(gfp); ++ if (unlikely(!p)) ++ goto out_dpages; ++ dpages->dpages[0].ndentry = 0; ++ dpages->dpages[0].dentries = p; ++ dpages->ndpage = 1; ++ return 0; /* success */ ++ ++ out_dpages: ++ kfree(dpages->dpages); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++void au_dpages_free(struct au_dcsub_pages *dpages) ++{ ++ int i; ++ ++ TraceEnter(); ++ ++ for (i = 0; i < dpages->ndpage; i++) ++ au_dpage_free(dpages->dpages + i); ++ kfree(dpages->dpages); ++} ++ ++static int au_dpages_append(struct au_dcsub_pages *dpages, ++ struct dentry *dentry, gfp_t gfp) ++{ ++ int err, sz; ++ struct au_dpage *dpage; ++ void *p; ++ ++ //TraceEnter(); ++ ++ dpage = dpages->dpages + dpages->ndpage - 1; ++ DEBUG_ON(!dpage); ++ sz = PAGE_SIZE/sizeof(dentry); ++ if (unlikely(dpage->ndentry >= sz)) { ++ LKTRLabel(new dpage); ++ err = -ENOMEM; ++ sz = dpages->ndpage * sizeof(*dpages->dpages); ++ p = au_kzrealloc(dpages->dpages, sz, ++ sz + sizeof(*dpages->dpages), gfp); ++ if (unlikely(!p)) ++ goto out; ++ dpage = dpages->dpages + dpages->ndpage; ++ p = (void*)__get_free_page(gfp); ++ if (unlikely(!p)) ++ goto out; ++ dpage->ndentry = 0; ++ dpage->dentries = p; ++ dpages->ndpage++; ++ } ++ ++ dpage->dentries[dpage->ndentry++] = dget(dentry); ++ return 0; /* success */ ++ ++ out: ++ //TraceErr(err); ++ return err; ++} ++ ++int au_dcsub_pages(struct au_dcsub_pages *dpages, struct dentry *root, ++ au_dpages_test test, void *arg) ++{ ++ int err; ++ struct dentry *this_parent = root; ++ struct list_head *next; ++ struct super_block *sb = root->d_sb; ++ ++ TraceEnter(); ++ ++ err = 0; ++ spin_lock(&dcache_lock); ++ repeat: ++ next = this_parent->d_subdirs.next; ++ resume: ++ if (this_parent->d_sb == sb ++ && !IS_ROOT(this_parent) ++ && atomic_read(&this_parent->d_count) ++ && this_parent->d_inode ++ && (!test || test(this_parent, arg))) { ++ err = au_dpages_append(dpages, this_parent, GFP_ATOMIC); ++ if (unlikely(err)) ++ goto out; ++ } ++ ++ while (next != &this_parent->d_subdirs) { ++ struct list_head *tmp = next; ++ struct dentry *dentry = list_entry(tmp, struct dentry, D_CHILD); ++ next = tmp->next; ++ if (unlikely(/*d_unhashed(dentry) || */!dentry->d_inode)) ++ continue; ++ if (!list_empty(&dentry->d_subdirs)) { ++ this_parent = dentry; ++ goto repeat; ++ } ++ if (dentry->d_sb == sb ++ && atomic_read(&dentry->d_count) ++ && (!test || test(dentry, arg))) { ++ err = au_dpages_append(dpages, dentry, GFP_ATOMIC); ++ if (unlikely(err)) ++ goto out; ++ } ++ } ++ ++ if (this_parent != root) { ++ next = this_parent->D_CHILD.next; ++ this_parent = this_parent->d_parent; ++ goto resume; ++ } ++ out: ++ spin_unlock(&dcache_lock); ++#if 0 ++ if (!err) { ++ int i, j; ++ j = 0; ++ for (i = 0; i < dpages->ndpage; i++) { ++ if ((dpages->dpages + i)->ndentry) ++ Dbg("%d: %d\n", i, (dpages->dpages + i)->ndentry); ++ j += (dpages->dpages + i)->ndentry; ++ } ++ if (j) ++ Dbg("ndpage %d, %d\n", dpages->ndpage, j); ++ } ++#endif ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/dcsub.h b/fs/aufs/dcsub.h +new file mode 100755 +index 0000000..0ba034b +--- /dev/null ++++ b/fs/aufs/dcsub.h +@@ -0,0 +1,47 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: dcsub.h,v 1.2 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_DCSUB_H__ ++#define __AUFS_DCSUB_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/dcache.h> ++ ++struct au_dpage { ++ int ndentry; ++ struct dentry **dentries; ++}; ++ ++struct au_dcsub_pages { ++ int ndpage; ++ struct au_dpage *dpages; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++int au_dpages_init(struct au_dcsub_pages *dpages, gfp_t gfp); ++void au_dpages_free(struct au_dcsub_pages *dpages); ++typedef int (*au_dpages_test)(struct dentry *dentry, void *arg); ++int au_dcsub_pages(struct au_dcsub_pages *dpages, struct dentry *root, ++ au_dpages_test test, void *arg); ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_DCSUB_H__ */ +diff --git a/fs/aufs/debug.c b/fs/aufs/debug.c +new file mode 100755 +index 0000000..99d158b +--- /dev/null ++++ b/fs/aufs/debug.c +@@ -0,0 +1,262 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: debug.c,v 1.27 2007/04/30 05:48:23 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++atomic_t aufs_cond = ATOMIC_INIT(0); ++ ++#if defined(CONFIG_LKTR) || defined(CONFIG_LKTR_MODULE) ++#define dpri(fmt, arg...) \ ++ do {if (LktrCond) printk(KERN_DEBUG fmt, ##arg);} while (0) ++#else ++#define dpri(fmt, arg...) printk(KERN_DEBUG fmt, ##arg) ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++void au_dpri_whlist(struct aufs_nhash *whlist) ++{ ++ int i; ++ struct hlist_head *head; ++ struct aufs_wh *tpos; ++ struct hlist_node *pos; ++ ++ for (i = 0; i < AUFS_NHASH_SIZE; i++) { ++ head = whlist->heads + i; ++ hlist_for_each_entry(tpos, pos, head, wh_hash) ++ dpri("b%d, %.*s, %d\n", ++ tpos->wh_bindex, ++ tpos->wh_str.len, tpos->wh_str.name, ++ tpos->wh_str.len); ++ } ++} ++ ++void au_dpri_vdir(struct aufs_vdir *vdir) ++{ ++ int i; ++ union aufs_deblk_p p; ++ unsigned char *o; ++ ++ if (!vdir || IS_ERR(vdir)) { ++ dpri("err %ld\n", PTR_ERR(vdir)); ++ return; ++ } ++ ++ dpri("nblk %d, deblk %p %d, last{%d, %p}, ver %lu\n", ++ vdir->vd_nblk, vdir->vd_deblk, ksize(vdir->vd_deblk), ++ vdir->vd_last.i, vdir->vd_last.p.p, vdir->vd_version); ++ for (i = 0; i < vdir->vd_nblk; i++) { ++ p.deblk = vdir->vd_deblk[i]; ++ o = p.p; ++ dpri("[%d]: %p %d\n", i, o, ksize(o)); ++#if 0 // verbose ++ int j; ++ for (j = 0; j < 8; j++) { ++ dpri("%p(+%d) {%02x %02x %02x %02x %02x %02x %02x %02x " ++ "%02x %02x %02x %02x %02x %02x %02x %02x}\n", ++ p.p, p.p - o, ++ p.p[0], p.p[1], p.p[2], p.p[3], ++ p.p[4], p.p[5], p.p[6], p.p[7], ++ p.p[8], p.p[9], p.p[10], p.p[11], ++ p.p[12], p.p[13], p.p[14], p.p[15]); ++ p.p += 16; ++ } ++#endif ++ } ++} ++ ++static int do_pri_inode(aufs_bindex_t bindex, struct inode *inode) ++{ ++ if (!inode || IS_ERR(inode)) { ++ dpri("i%d: err %ld\n", bindex, PTR_ERR(inode)); ++ return -1; ++ } ++ ++ /* the type of i_blocks depends upon CONFIG_LSF */ ++ BUILD_BUG_ON(sizeof(inode->i_blocks) != sizeof(unsigned long) ++ && sizeof(inode->i_blocks) != sizeof(u64)); ++ dpri("i%d: i%lu, %s, cnt %d, nl %u, 0%o, sz %Lu, blk %Lu," ++ " ct %Ld, np %lu, st 0x%lx, g %x\n", ++ bindex, ++ inode->i_ino, inode->i_sb ? au_sbtype(inode->i_sb) : "??", ++ atomic_read(&inode->i_count), inode->i_nlink, inode->i_mode, ++ i_size_read(inode), (u64)inode->i_blocks, ++ timespec_to_ns(&inode->i_ctime) & 0x0ffff, ++ inode->i_mapping ? inode->i_mapping->nrpages : 0, ++ inode->i_state, inode->i_generation); ++ return 0; ++} ++ ++void au_dpri_inode(struct inode *inode) ++{ ++ struct aufs_iinfo *iinfo; ++ aufs_bindex_t bindex; ++ int err; ++ ++ err = do_pri_inode(-1, inode); ++ if (err || !au_is_aufs(inode->i_sb)) ++ return; ++ ++ iinfo = itoii(inode); ++ if (!iinfo) ++ return; ++ dpri("i-1: bstart %d, bend %d, gen %d\n", ++ iinfo->ii_bstart, iinfo->ii_bend, au_iigen(inode)); ++ if (iinfo->ii_bstart < 0) ++ return; ++ for (bindex = iinfo->ii_bstart; bindex <= iinfo->ii_bend; bindex++) ++ do_pri_inode(bindex, iinfo->ii_hinode[0 + bindex].hi_inode); ++} ++ ++static int do_pri_dentry(aufs_bindex_t bindex, struct dentry *dentry) ++{ ++ if (!dentry || IS_ERR(dentry)) { ++ dpri("d%d: err %ld\n", bindex, PTR_ERR(dentry)); ++ return -1; ++ } ++ dpri("d%d: %.*s/%.*s, %s, cnt %d, flags 0x%x\n", ++ bindex, ++ DLNPair(dentry->d_parent), DLNPair(dentry), ++ dentry->d_sb ? au_sbtype(dentry->d_sb) : "??", ++ atomic_read(&dentry->d_count), dentry->d_flags); ++ do_pri_inode(bindex, dentry->d_inode); ++ return 0; ++} ++ ++void au_dpri_dentry(struct dentry *dentry) ++{ ++ struct aufs_dinfo *dinfo; ++ aufs_bindex_t bindex; ++ int err; ++ ++ err = do_pri_dentry(-1, dentry); ++ if (err || !au_is_aufs(dentry->d_sb)) ++ return; ++ ++ dinfo = dtodi(dentry); ++ if (!dinfo) ++ return; ++ dpri("d-1: bstart %d, bend %d, bwh %d, bdiropq %d, gen %d\n", ++ dinfo->di_bstart, dinfo->di_bend, ++ dinfo->di_bwh, dinfo->di_bdiropq, au_digen(dentry)); ++ if (dinfo->di_bstart < 0) ++ return; ++ for (bindex = dinfo->di_bstart; bindex <= dinfo->di_bend; bindex++) ++ do_pri_dentry(bindex, dinfo->di_hdentry[0 + bindex].hd_dentry); ++} ++ ++static int do_pri_file(aufs_bindex_t bindex, struct file *file) ++{ ++ char a[32]; ++ ++ if (!file || IS_ERR(file)) { ++ dpri("f%d: err %ld\n", bindex, PTR_ERR(file)); ++ return -1; ++ } ++ a[0] = 0; ++ if (bindex == -1 && ftofi(file)) ++ snprintf(a, sizeof(a), ", mmapped %d", au_is_mmapped(file)); ++ dpri("f%d: mode 0x%x, flags 0%o, cnt %d, pos %Lu%s\n", ++ bindex, file->f_mode, file->f_flags, file_count(file), ++ file->f_pos, a); ++ do_pri_dentry(bindex, file->f_dentry); ++ return 0; ++} ++ ++void au_dpri_file(struct file *file) ++{ ++ struct aufs_finfo *finfo; ++ aufs_bindex_t bindex; ++ int err; ++ ++ err = do_pri_file(-1, file); ++ if (err || !file->f_dentry || !au_is_aufs(file->f_dentry->d_sb)) ++ return; ++ ++ finfo = ftofi(file); ++ if (!finfo) ++ return; ++ if (finfo->fi_bstart < 0) ++ return; ++ for (bindex = finfo->fi_bstart; bindex <= finfo->fi_bend; bindex++) { ++ struct aufs_hfile *hf; ++ //dpri("bindex %d\n", bindex); ++ hf = finfo->fi_hfile + bindex; ++ do_pri_file(bindex, hf ? hf->hf_file : NULL); ++ } ++} ++ ++static int do_pri_br(aufs_bindex_t bindex, struct aufs_branch *br) ++{ ++ struct vfsmount *mnt; ++ struct super_block *sb; ++ ++ if (!br || IS_ERR(br) ++ || !(mnt = br->br_mnt) || IS_ERR(mnt) ++ || !(sb = mnt->mnt_sb) || IS_ERR(sb)) { ++ dpri("s%d: err %ld\n", bindex, PTR_ERR(br)); ++ return -1; ++ } ++ ++ dpri("s%d: {perm 0x%x, cnt %d}, " ++ "%s, flags 0x%lx, cnt(BIAS) %d, active %d, xino %p %p\n", ++ bindex, br->br_perm, br_count(br), ++ au_sbtype(sb), sb->s_flags, sb->s_count - S_BIAS, ++ atomic_read(&sb->s_active), br->br_xino, ++ br->br_xino ? br->br_xino->f_dentry : NULL); ++ return 0; ++} ++ ++void au_dpri_sb(struct super_block *sb) ++{ ++ struct aufs_sbinfo *sbinfo; ++ aufs_bindex_t bindex; ++ int err; ++ struct vfsmount mnt = {.mnt_sb = sb}; ++ struct aufs_branch fake = { ++ .br_perm = 0, ++ .br_mnt = &mnt, ++ .br_count = ATOMIC_INIT(0), ++ .br_xino = NULL ++ }; ++ ++ atomic_set(&fake.br_count, 0); ++ err = do_pri_br(-1, &fake); ++ dpri("dev 0x%x\n", sb->s_dev); ++ if (err || !au_is_aufs(sb)) ++ return; ++ ++ sbinfo = stosi(sb); ++ if (!sbinfo) ++ return; ++ for (bindex = 0; bindex <= sbinfo->si_bend; bindex++) { ++ //dpri("bindex %d\n", bindex); ++ do_pri_br(bindex, sbinfo->si_branch[0 + bindex]); ++ } ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++void DbgSleep(int sec) ++{ ++ static DECLARE_WAIT_QUEUE_HEAD(wq); ++ Dbg("sleep %d sec\n", sec); ++ wait_event_timeout(wq, 0, sec * HZ); ++} +diff --git a/fs/aufs/debug.h b/fs/aufs/debug.h +new file mode 100755 +index 0000000..53f5f6a +--- /dev/null ++++ b/fs/aufs/debug.h +@@ -0,0 +1,129 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: debug.h,v 1.31 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_DEBUG_H__ ++#define __AUFS_DEBUG_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++ ++#ifdef CONFIG_AUFS_DEBUG ++#define DEBUG_ON(a) BUG_ON(a) ++extern atomic_t aufs_cond; ++#define au_debug_on() atomic_inc(&aufs_cond) ++#define au_debug_off() atomic_dec(&aufs_cond) ++#define au_is_debug() atomic_read(&aufs_cond) ++#else ++#define DEBUG_ON(a) /* */ ++#define au_debug_on() /* */ ++#define au_debug_off() /* */ ++#define au_is_debug() 0 ++#endif ++ ++#define MtxMustLock(mtx) DEBUG_ON(!mutex_is_locked(mtx)) ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* debug print */ ++#if defined(CONFIG_LKTR) || defined(CONFIG_LKTR_MODULE) ++#include <linux/lktr.h> ++#ifdef CONFIG_AUFS_DEBUG ++#undef LktrCond ++#define LktrCond unlikely((lktr_cond && lktr_cond()) || au_is_debug()) ++#endif ++#else ++#define LktrCond au_is_debug() ++#define LKTRDumpVma(pre, vma, suf) /* */ ++#define LKTRDumpStack() /* */ ++#define LKTRTrace(fmt, args...) do { \ ++ if (LktrCond) \ ++ Dbg(fmt, ##args); \ ++} while (0) ++#define LKTRLabel(label) LKTRTrace("%s\n", #label) ++#endif /* CONFIG_LKTR */ ++ ++#define TraceErr(e) do { \ ++ if (unlikely((e) < 0)) \ ++ LKTRTrace("err %d\n", (int)(e)); \ ++} while (0) ++#define TraceErrPtr(p) do { \ ++ if (IS_ERR(p)) \ ++ LKTRTrace("err %ld\n", PTR_ERR(p)); \ ++} while (0) ++#define TraceEnter() LKTRLabel(enter) ++ ++/* dirty macros for debug print, use with "%.*s" and caution */ ++#define LNPair(qstr) (qstr)->len,(qstr)->name ++#define DLNPair(d) LNPair(&(d)->d_name) ++ ++/* ---------------------------------------------------------------------- */ ++ ++#define Dpri(lvl, fmt, arg...) \ ++ printk(lvl AUFS_NAME " %s:%d:%s[%d]: " fmt, \ ++ __func__, __LINE__, current->comm, current->pid, ##arg) ++#define Dbg(fmt, arg...) Dpri(KERN_DEBUG, fmt, ##arg) ++#define Warn(fmt, arg...) Dpri(KERN_WARNING, fmt, ##arg) ++#define Warn1(fmt, arg...) do { \ ++ static unsigned char c; \ ++ if (!c++) Warn(fmt, ##arg); \ ++ } while (0) ++#define Err(fmt, arg...) Dpri(KERN_ERR, fmt, ##arg) ++#define Err1(fmt, arg...) do { \ ++ static unsigned char c; \ ++ if (!c++) Err(fmt, ##arg); \ ++ } while (0) ++#define IOErr(fmt, arg...) Err("I/O Error, " fmt, ##arg) ++#define IOErr1(fmt, arg...) do { \ ++ static unsigned char c; \ ++ if (!c++) IOErr(fmt, ##arg); \ ++ } while (0) ++#define IOErrWhck(fmt, arg...) Err("I/O Error, try whck. " fmt, ##arg) ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_DEBUG ++struct aufs_nhash; ++void au_dpri_whlist(struct aufs_nhash *whlist); ++struct aufs_vdir; ++void au_dpri_vdir(struct aufs_vdir *vdir); ++void au_dpri_inode(struct inode *inode); ++void au_dpri_dentry(struct dentry *dentry); ++void au_dpri_file(struct file *filp); ++void au_dpri_sb(struct super_block *sb); ++#define DbgWhlist(w) do{LKTRTrace(#w "\n"); au_dpri_whlist(w);}while(0) ++#define DbgVdir(v) do{LKTRTrace(#v "\n"); au_dpri_vdir(v);}while(0) ++#define DbgInode(i) do{LKTRTrace(#i "\n"); au_dpri_inode(i);}while(0) ++#define DbgDentry(d) do{LKTRTrace(#d "\n"); au_dpri_dentry(d);}while(0) ++#define DbgFile(f) do{LKTRTrace(#f "\n"); au_dpri_file(f);}while(0) ++#define DbgSb(sb) do{LKTRTrace(#sb "\n"); au_dpri_sb(sb);}while(0) ++void DbgSleep(int sec); ++#else ++#define DbgWhlist(w) /* */ ++#define DbgVdir(v) /* */ ++#define DbgInode(i) /* */ ++#define DbgDentry(d) /* */ ++#define DbgFile(f) /* */ ++#define DbgSb(sb) /* */ ++#define DbgSleep(sec) /* */ ++#endif ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_DEBUG_H__ */ +diff --git a/fs/aufs/dentry.c b/fs/aufs/dentry.c +new file mode 100755 +index 0000000..2acb89b +--- /dev/null ++++ b/fs/aufs/dentry.c +@@ -0,0 +1,946 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: dentry.c,v 1.41 2007/05/14 03:38:38 sfjro Exp $ */ ++ ++//#include <linux/fs.h> ++//#include <linux/namei.h> ++#include "aufs.h" ++ ++#ifdef CONFIG_AUFS_LHASH_PATCH ++ ++#ifdef CONFIG_AUFS_DLGT ++struct lookup_hash_args { ++ struct dentry **errp; ++ struct qstr *name; ++ struct dentry *base; ++ struct nameidata *nd; ++}; ++ ++static void call_lookup_hash(void *args) ++{ ++ struct lookup_hash_args *a = args; ++ *a->errp = __lookup_hash(a->name, a->base, a->nd); ++} ++#endif /* CONFIG_AUFS_DLGT */ ++ ++static struct dentry *lkup_hash(const char *name, struct dentry *parent, ++ int len, struct lkup_args *lkup) ++{ ++ struct dentry *dentry; ++ char *p; ++ unsigned long hash; ++ struct qstr this; ++ unsigned int c; ++ struct nameidata tmp_nd; ++ ++ dentry = ERR_PTR(-EACCES); ++ this.name = name; ++ this.len = len; ++ if (unlikely(!len)) ++ goto out; ++ ++ p = (void*)name; ++ hash = init_name_hash(); ++ while (len--) { ++ c = *p++; ++ if (unlikely(c == '/' || c == '\0')) ++ goto out; ++ hash = partial_name_hash(c, hash); ++ } ++ this.hash = end_name_hash(hash); ++ ++ memset(&tmp_nd, 0, sizeof(tmp_nd)); ++ tmp_nd.dentry = dget(parent); ++ tmp_nd.mnt = mntget(lkup->nfsmnt); ++#ifndef CONFIG_AUFS_DLGT ++ dentry = __lookup_hash(&this, parent, &tmp_nd); ++#else ++ if (!lkup->dlgt) ++ dentry = __lookup_hash(&this, parent, &tmp_nd); ++ else { ++ struct lookup_hash_args args = { ++ .errp = &dentry, ++ .name = &this, ++ .base = parent, ++ .nd = &tmp_nd ++ }; ++ au_wkq_wait(call_lookup_hash, &args, /*dlgt*/1); ++ } ++#endif ++ path_release(&tmp_nd); ++ ++ out: ++ TraceErrPtr(dentry); ++ return dentry; ++} ++#elif defined(CONFIG_AUFS_DLGT) ++static struct dentry *lkup_hash(const char *name, struct dentry *parent, ++ int len, struct lkup_args *lkup) ++{ ++ return ERR_PTR(-ENOSYS); ++} ++#endif ++ ++#ifdef CONFIG_AUFS_DLGT ++struct lookup_one_len_args { ++ struct dentry **errp; ++ const char *name; ++ struct dentry *parent; ++ int len; ++}; ++ ++static void call_lookup_one_len(void *args) ++{ ++ struct lookup_one_len_args *a = args; ++ *a->errp = lookup_one_len(a->name, a->parent, a->len); ++} ++#endif /* CONFIG_AUFS_DLGT */ ++ ++#if defined(CONFIG_AUFS_LHASH_PATCH) || defined(CONFIG_AUFS_DLGT) ++/* cf. lookup_one_len() in linux/fs/namei.c */ ++struct dentry *lkup_one(const char *name, struct dentry *parent, int len, ++ struct lkup_args *lkup) ++{ ++ struct dentry *dentry; ++ ++ LKTRTrace("%.*s/%.*s, lkup{%p, %d}\n", ++ DLNPair(parent), len, name, lkup->nfsmnt, lkup->dlgt); ++ ++ if (!lkup->nfsmnt) { ++#ifndef CONFIG_AUFS_DLGT ++ dentry = lookup_one_len(name, parent, len); ++#else ++ if (!lkup->dlgt) ++ dentry = lookup_one_len(name, parent, len); ++ else { ++ struct lookup_one_len_args args = { ++ .errp = &dentry, ++ .name = name, ++ .parent = parent, ++ .len = len ++ }; ++ au_wkq_wait(call_lookup_one_len, &args, /*dlgt*/1); ++ } ++#endif ++ } else ++ dentry = lkup_hash(name, parent, len, lkup); ++ ++ TraceErrPtr(dentry); ++ return dentry; ++} ++#endif ++ ++struct lkup_one_args { ++ struct dentry **errp; ++ const char *name; ++ struct dentry *parent; ++ int len; ++ struct lkup_args *lkup; ++}; ++ ++static void call_lkup_one(void *args) ++{ ++ struct lkup_one_args *a = args; ++ *a->errp = lkup_one(a->name, a->parent, a->len, a->lkup); ++} ++ ++/* ++ * returns positive/negative dentry, NULL or an error. ++ * NULL means whiteout-ed or not-found. ++ */ ++static struct dentry *do_lookup(struct dentry *hidden_parent, ++ struct dentry *dentry, aufs_bindex_t bindex, ++ struct qstr *wh_name, int allow_neg, ++ mode_t type, int dlgt) ++{ ++ struct dentry *hidden_dentry; ++ int wh_found, wh_able, opq; ++ struct inode *hidden_dir, *hidden_inode; ++ struct qstr *name; ++ struct super_block *sb; ++ struct lkup_args lkup = {.dlgt = dlgt}; ++ ++ LKTRTrace("%.*s/%.*s, b%d, allow_neg %d, type 0%o, dlgt %d\n", ++ DLNPair(hidden_parent), DLNPair(dentry), bindex, allow_neg, ++ type, dlgt); ++ DEBUG_ON(IS_ROOT(dentry)); ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ ++ wh_found = 0; ++ sb = dentry->d_sb; ++ wh_able = sbr_is_whable(sb, bindex); ++ lkup.nfsmnt = au_nfsmnt(sb, bindex); ++ name = &dentry->d_name; ++ if (unlikely(wh_able)) { ++#if 0 //def CONFIG_AUFS_ROBR ++ if (strncmp(name->name, AUFS_WH_PFX, AUFS_WH_PFX_LEN)) ++ wh_found = is_wh(hidden_parent, wh_name, /*try_sio*/0, ++ &lkup); ++ else ++ wh_found = -EPERM; ++#else ++ wh_found = is_wh(hidden_parent, wh_name, /*try_sio*/0, &lkup); ++#endif ++ } ++ //if (LktrCond) wh_found = -1; ++ hidden_dentry = ERR_PTR(wh_found); ++ if (!wh_found) ++ goto real_lookup; ++ if (unlikely(wh_found < 0)) ++ goto out; ++ ++ /* We found a whiteout */ ++ //set_dbend(dentry, bindex); ++ set_dbwh(dentry, bindex); ++ if (!allow_neg) ++ return NULL; /* success */ ++ ++ real_lookup: ++ // do not superio. ++ hidden_dentry = lkup_one(name->name, hidden_parent, name->len, &lkup); ++ //if (LktrCond) {dput(hidden_dentry); hidden_dentry = ERR_PTR(-1);} ++ if (IS_ERR(hidden_dentry)) ++ goto out; ++ DEBUG_ON(d_unhashed(hidden_dentry)); ++ hidden_inode = hidden_dentry->d_inode; ++ if (!hidden_inode) { ++ if (!allow_neg) ++ goto out_neg; ++ } else if (wh_found ++ || (type && type != (hidden_inode->i_mode & S_IFMT))) ++ goto out_neg; ++ ++ if (dbend(dentry) <= bindex) ++ set_dbend(dentry, bindex); ++ if (dbstart(dentry) == -1 || bindex < dbstart(dentry)) ++ set_dbstart(dentry, bindex); ++ set_h_dptr(dentry, bindex, hidden_dentry); ++ ++ if (!hidden_inode || !S_ISDIR(hidden_inode->i_mode) || !wh_able) ++ return hidden_dentry; /* success */ ++ ++ hi_lock_child(hidden_inode); ++ opq = is_diropq(hidden_dentry, &lkup); ++ //if (LktrCond) opq = -1; ++ i_unlock(hidden_inode); ++ if (opq > 0) ++ set_dbdiropq(dentry, bindex); ++ else if (unlikely(opq < 0)) { ++ set_h_dptr(dentry, bindex, NULL); ++ hidden_dentry = ERR_PTR(opq); ++ } ++ goto out; ++ ++ out_neg: ++ dput(hidden_dentry); ++ hidden_dentry = NULL; ++ out: ++ TraceErrPtr(hidden_dentry); ++ return hidden_dentry; ++} ++ ++/* ++ * returns the number of hidden positive dentries, ++ * otherwise an error. ++ */ ++int lkup_dentry(struct dentry *dentry, aufs_bindex_t bstart, mode_t type) ++{ ++ int npositive, err, allow_neg, dlgt; ++ struct dentry *parent; ++ aufs_bindex_t bindex, btail; ++ const struct qstr *name = &dentry->d_name; ++ struct qstr whname; ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s, b%d, type 0%o\n", LNPair(name), bstart, type); ++ DEBUG_ON(bstart < 0 || IS_ROOT(dentry)); ++ parent = dget_parent(dentry); ++ ++#if 1 //ndef CONFIG_AUFS_ROBR ++ err = -EPERM; ++ if (unlikely(!strncmp(name->name, AUFS_WH_PFX, AUFS_WH_PFX_LEN))) ++ goto out; ++#endif ++ ++ err = au_alloc_whname(name->name, name->len, &whname); ++ //if (LktrCond) {au_free_whname(&whname); err = -1;} ++ if (unlikely(err)) ++ goto out; ++ ++ sb = dentry->d_sb; ++ dlgt = need_dlgt(sb); ++ allow_neg = !type; ++ npositive = 0; ++ btail = dbtaildir(parent); ++ for (bindex = bstart; bindex <= btail; bindex++) { ++ struct dentry *hidden_parent, *hidden_dentry; ++ struct inode *hidden_inode; ++ struct inode *hidden_dir; ++ ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (hidden_dentry) { ++ if (hidden_dentry->d_inode) ++ npositive++; ++ if (type != S_IFDIR) ++ break; ++ continue; ++ } ++ hidden_parent = au_h_dptr_i(parent, bindex); ++ if (!hidden_parent) ++ continue; ++ hidden_dir = hidden_parent->d_inode; ++ if (!hidden_dir || !S_ISDIR(hidden_dir->i_mode)) ++ continue; ++ ++ hi_lock_parent(hidden_dir); ++ hidden_dentry = do_lookup(hidden_parent, dentry, bindex, ++ &whname, allow_neg, type, dlgt); ++ // do not dput for testing ++ //if (LktrCond) {hidden_dentry = ERR_PTR(-1);} ++ i_unlock(hidden_dir); ++ err = PTR_ERR(hidden_dentry); ++ if (IS_ERR(hidden_dentry)) ++ goto out_wh; ++ allow_neg = 0; ++ ++ if (dbwh(dentry) != -1) ++ break; ++ if (!hidden_dentry) ++ continue; ++ hidden_inode = hidden_dentry->d_inode; ++ if (!hidden_inode) ++ continue; ++ npositive++; ++ if (!type) ++ type = hidden_inode->i_mode & S_IFMT; ++ if (type != S_IFDIR) ++ break; ++ else if (dbdiropq(dentry) != -1) ++ break; ++ } ++ ++ if (npositive) { ++ LKTRLabel(positive); ++ au_update_dbstart(dentry); ++ } ++ err = npositive; ++ ++ out_wh: ++ au_free_whname(&whname); ++ out: ++ dput(parent); ++ TraceErr(err); ++ return err; ++} ++ ++struct dentry *sio_lkup_one(const char *name, struct dentry *parent, int len, ++ struct lkup_args *lkup) ++{ ++ struct dentry *dentry; ++ ++ LKTRTrace("%.*s/%.*s\n", DLNPair(parent), len, name); ++ IMustLock(parent->d_inode); ++ ++ if (!au_test_perm(parent->d_inode, MAY_EXEC, lkup->dlgt)) ++ dentry = lkup_one(name, parent, len, lkup); ++ else { ++ // ugly ++ int dlgt = lkup->dlgt; ++ struct lkup_one_args args = { ++ .errp = &dentry, ++ .name = name, ++ .parent = parent, ++ .len = len, ++ .lkup = lkup ++ }; ++ ++ lkup->dlgt = 0; ++ au_wkq_wait(call_lkup_one, &args, /*dlgt*/0); ++ lkup->dlgt = dlgt; ++ } ++ ++ TraceErrPtr(dentry); ++ return dentry; ++} ++ ++/* ++ * lookup @dentry on @bindex which should be negative. ++ */ ++int lkup_neg(struct dentry *dentry, aufs_bindex_t bindex) ++{ ++ int err; ++ struct dentry *parent, *hidden_parent, *hidden_dentry; ++ struct inode *hidden_dir; ++ struct lkup_args lkup; ++ ++ LKTRTrace("%.*s, b%d\n", DLNPair(dentry), bindex); ++ parent = dget_parent(dentry); ++ DEBUG_ON(!parent || !parent->d_inode ++ || !S_ISDIR(parent->d_inode->i_mode)); ++ hidden_parent = au_h_dptr_i(parent, bindex); ++ DEBUG_ON(!hidden_parent); ++ hidden_dir = hidden_parent->d_inode; ++ DEBUG_ON(!hidden_dir || !S_ISDIR(hidden_dir->i_mode)); ++ IMustLock(hidden_dir); ++ ++ lkup.nfsmnt = au_nfsmnt(dentry->d_sb, bindex); ++ lkup.dlgt = need_dlgt(dentry->d_sb); ++ hidden_dentry = sio_lkup_one(dentry->d_name.name, hidden_parent, ++ dentry->d_name.len, &lkup); ++ //if (LktrCond) {dput(hidden_dentry); hidden_dentry = ERR_PTR(-1);} ++ err = PTR_ERR(hidden_dentry); ++ if (IS_ERR(hidden_dentry)) ++ goto out; ++ if (unlikely(hidden_dentry->d_inode)) { ++ err = -EIO; ++ IOErr("b%d %.*s should be negative.%s\n", ++ bindex, DLNPair(hidden_dentry), ++ au_flag_test(dentry->d_sb, AuFlag_UDBA_INOTIFY) ? "" : ++ " Try udba=inotify."); ++ dput(hidden_dentry); ++ goto out; ++ } ++ ++ if (bindex < dbstart(dentry)) ++ set_dbstart(dentry, bindex); ++ if (dbend(dentry) < bindex) ++ set_dbend(dentry, bindex); ++ set_h_dptr(dentry, bindex, hidden_dentry); ++ err = 0; ++ ++ out: ++ dput(parent); ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * returns the number of found hidden positive dentries, ++ * otherwise an error. ++ */ ++int au_refresh_hdentry(struct dentry *dentry, mode_t type) ++{ ++ int npositive, pgen, new_sz, sgen, dgen; ++ struct aufs_dinfo *dinfo; ++ struct super_block *sb; ++ struct dentry *parent; ++ aufs_bindex_t bindex, parent_bend, parent_bstart, bwh, bdiropq, bend; ++ struct aufs_hdentry *p; ++ //struct nameidata nd; ++ ++ LKTRTrace("%.*s, type 0%o\n", DLNPair(dentry), type); ++ DiMustWriteLock(dentry); ++ sb = dentry->d_sb; ++ DEBUG_ON(IS_ROOT(dentry)); ++ parent = dget_parent(dentry); ++ pgen = au_digen(parent); ++ sgen = au_sigen(sb); ++ dgen = au_digen(dentry); ++ DEBUG_ON(pgen != sgen); ++ ++ npositive = -ENOMEM; ++ new_sz = sizeof(*dinfo->di_hdentry) * (sbend(sb) + 1); ++ dinfo = dtodi(dentry); ++ p = au_kzrealloc(dinfo->di_hdentry, sizeof(*p) * (dinfo->di_bend + 1), ++ new_sz, GFP_KERNEL); ++ //p = NULL; ++ if (unlikely(!p)) ++ goto out; ++ dinfo->di_hdentry = p; ++ ++ bend = dinfo->di_bend; ++ bwh = dinfo->di_bwh; ++ bdiropq = dinfo->di_bdiropq; ++ p += dinfo->di_bstart; ++ for (bindex = dinfo->di_bstart; bindex <= bend; bindex++, p++) { ++ struct dentry *hd, *hdp; ++ struct aufs_hdentry tmp, *q; ++ aufs_bindex_t new_bindex; ++ ++ hd = p->hd_dentry; ++ if (!hd) ++ continue; ++ hdp = dget_parent(hd); ++ if (hdp == au_h_dptr_i(parent, bindex)) { ++ dput(hdp); ++ continue; ++ } ++ ++ new_bindex = au_find_dbindex(parent, hdp); ++ dput(hdp); ++ DEBUG_ON(new_bindex == bindex); ++ if (dinfo->di_bwh == bindex) ++ bwh = new_bindex; ++ if (dinfo->di_bdiropq == bindex) ++ bdiropq = new_bindex; ++ if (new_bindex < 0) { // test here ++ hdput(p); ++ p->hd_dentry = NULL; ++ continue; ++ } ++ /* swap two hidden dentries, and loop again */ ++ q = dinfo->di_hdentry + new_bindex; ++ tmp = *q; ++ *q = *p; ++ *p = tmp; ++ if (tmp.hd_dentry) { ++ bindex--; ++ p--; ++ } ++ } ++ ++ // test here ++ dinfo->di_bwh = -1; ++ if (unlikely(bwh != -1 && bwh <= sbend(sb) && sbr_is_whable(sb, bwh))) ++ dinfo->di_bwh = bwh; ++ dinfo->di_bdiropq = -1; ++ if (unlikely(bdiropq != -1 && bdiropq <= sbend(sb) ++ && sbr_is_whable(sb, bdiropq))) ++ dinfo->di_bdiropq = bdiropq; ++ parent_bend = dbend(parent); ++ p = dinfo->di_hdentry; ++ for (bindex = 0; bindex <= parent_bend; bindex++, p++) ++ if (p->hd_dentry) { ++ dinfo->di_bstart = bindex; ++ break; ++ } ++ p = dinfo->di_hdentry + parent_bend; ++ //for (bindex = parent_bend; bindex > dinfo->di_bstart; bindex--, p--) ++ for (bindex = parent_bend; bindex >= 0; bindex--, p--) ++ if (p->hd_dentry) { ++ dinfo->di_bend = bindex; ++ break; ++ } ++ ++ npositive = 0; ++ parent_bstart = dbstart(parent); ++ if (type != S_IFDIR && dinfo->di_bstart == parent_bstart) ++ goto out_dgen; /* success */ ++ ++#if 0 ++ nd.last_type = LAST_ROOT; ++ nd.flags = LOOKUP_FOLLOW; ++ nd.depth = 0; ++ nd.mnt = mntget(??); ++ nd.dentry = dget(parent); ++#endif ++ npositive = lkup_dentry(dentry, parent_bstart, type); ++ //if (LktrCond) npositive = -1; ++ if (npositive < 0) ++ goto out; ++ ++ out_dgen: ++ au_update_digen(dentry); ++ out: ++ dput(parent); ++ TraceErr(npositive); ++ return npositive; ++} ++ ++static int h_d_revalidate(struct dentry *dentry, struct nameidata *nd, ++ int do_udba) ++{ ++ int err, plus, locked, unhashed, is_root, h_plus, is_nfs; ++ struct nameidata fake_nd, *p; ++ aufs_bindex_t bindex, btail, bstart, ibs, ibe; ++ struct super_block *sb; ++ struct inode *inode, *first, *h_inode, *h_cached_inode; ++ umode_t mode, h_mode; ++ struct dentry *h_dentry; ++ int (*reval)(struct dentry *, struct nameidata *); ++ struct qstr *name; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ inode = dentry->d_inode; ++ DEBUG_ON(inode && au_digen(dentry) != au_iigen(inode)); ++ //DbgDentry(dentry); ++ //DbgInode(inode); ++ ++ err = 0; ++ sb = dentry->d_sb; ++ plus = 0; ++ mode = 0; ++ first = NULL; ++ ibs = ibe = -1; ++ unhashed = d_unhashed(dentry); ++ is_root = IS_ROOT(dentry); ++ name = &dentry->d_name; ++ ++ /* ++ * Theoretically, REVAL test should be unnecessary in case of INOTIFY. ++ * But inotify doesn't fire some necessary events, ++ * IN_ATTRIB for atime/nlink/pageio ++ * IN_DELETE for NFS dentry ++ * Let's do REVAL test too. ++ */ ++ if (do_udba && inode) { ++ mode = (inode->i_mode & S_IFMT); ++ plus = (inode->i_nlink > 0); ++ first = au_h_iptr(inode); ++ ibs = ibstart(inode); ++ ibe = ibend(inode); ++ } ++ ++ btail = bstart = dbstart(dentry); ++ if (inode && S_ISDIR(inode->i_mode)) ++ btail = dbtaildir(dentry); ++ locked = 0; ++ if (nd) { ++ fake_nd = *nd; ++#ifndef CONFIG_AUFS_FAKE_DM ++ if (dentry != nd->dentry) { ++ di_read_lock_parent(nd->dentry, 0); ++ locked = 1; ++ } ++#endif ++ } ++ for (bindex = bstart; bindex <= btail; bindex++) { ++ h_dentry = au_h_dptr_i(dentry, bindex); ++ if (unlikely(!h_dentry)) ++ continue; ++ if (unlikely(do_udba ++ && !is_root ++ && (unhashed != d_unhashed(h_dentry) ++#if 1 ++ || name->len != h_dentry->d_name.len ++ || memcmp(name->name, h_dentry->d_name.name, ++ name->len) ++#endif ++ ))) { ++ LKTRTrace("unhash 0x%x 0x%x, %.*s %.*s\n", ++ unhashed, d_unhashed(h_dentry), ++ DLNPair(dentry), DLNPair(h_dentry)); ++ goto err; ++ } ++ ++ reval = NULL; ++ if (h_dentry->d_op) ++ reval = h_dentry->d_op->d_revalidate; ++ if (unlikely(reval)) { ++ //LKTRLabel(hidden reval); ++ p = fake_dm(&fake_nd, nd, sb, bindex); ++ DEBUG_ON(IS_ERR(p)); ++ err = !reval(h_dentry, p); ++ fake_dm_release(p); ++ if (unlikely(err)) { ++ //Dbg("here\n"); ++ goto err; ++ } ++ } ++ ++ if (unlikely(!do_udba)) ++ continue; ++ ++ /* UDBA tests */ ++ h_inode = h_dentry->d_inode; ++ if (unlikely(!!inode != !!h_inode)) { ++ //Dbg("here\n"); ++ goto err; ++ } ++ ++ h_plus = plus; ++ h_mode = mode; ++ h_cached_inode = h_inode; ++ is_nfs = 0; ++ if (h_inode) { ++ h_mode = (h_inode->i_mode & S_IFMT); ++ h_plus = (h_inode->i_nlink > 0); ++ } ++ if (inode && ibs <= bindex && bindex <= ibe) { ++ h_cached_inode = au_h_iptr_i(inode, bindex); ++ //is_nfs = au_is_nfs(h_cached_inode->i_sb); ++ } ++ ++ LKTRTrace("{%d, 0%o, %p}, h{%d, 0%o, %p}\n", ++ plus, mode, h_cached_inode, ++ h_plus, h_mode, h_inode); ++ if (unlikely(plus != h_plus || mode != h_mode ++ || (h_cached_inode != h_inode /* && !is_nfs */))) { ++ //Dbg("here\n"); ++ goto err; ++ } ++ continue; ++ ++ err: ++ err = -EINVAL; ++ break; ++ } ++#ifndef CONFIG_AUFS_FAKE_DM ++ if (unlikely(locked)) ++ di_read_unlock(nd->dentry, 0); ++#endif ++ ++#if 0 ++ // some filesystem uses CURRENT_TIME_SEC instead of CURRENT_TIME. ++ // NFS may stop IN_DELETE because of DCACHE_NFSFS_RENAMED. ++#if 0 ++ && (!timespec_equal(&inode->i_ctime, &first->i_ctime) ++ || !timespec_equal(&inode->i_atime, &first->i_atime)) ++#endif ++ if (unlikely(!err && udba && first)) ++ au_cpup_attr_all(inode); ++#endif ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int simple_reval_dpath(struct dentry *dentry, int sgen) ++{ ++ int err; ++ mode_t type; ++ struct dentry *parent; ++ struct inode *inode; ++ ++ LKTRTrace("%.*s, sgen %d\n", DLNPair(dentry), sgen); ++ SiMustAnyLock(dentry->d_sb); ++ DiMustWriteLock(dentry); ++ inode = dentry->d_inode; ++ DEBUG_ON(!inode); ++ ++ if (au_digen(dentry) == sgen) ++ return 0; ++ ++ parent = dget_parent(dentry); ++ di_read_lock_parent(parent, AUFS_I_RLOCK); ++ DEBUG_ON(au_digen(parent) != sgen); ++#ifdef CONFIG_AUFS_DEBUG ++ { ++ struct dentry *d = parent; ++ while (!IS_ROOT(d)) { ++ DEBUG_ON(au_digen(d) != sgen); ++ d = d->d_parent; ++ } ++ } ++#endif ++ type = (inode->i_mode & S_IFMT); ++ /* returns a number of positive dentries */ ++ err = au_refresh_hdentry(dentry, type); ++ if (err >= 0) ++ err = au_refresh_hinode(inode, dentry); ++ di_read_unlock(parent, AUFS_I_RLOCK); ++ dput(parent); ++ TraceErr(err); ++ return err; ++} ++ ++int au_reval_dpath(struct dentry *dentry, int sgen) ++{ ++ int err; ++ struct dentry *d, *parent; ++ struct inode *inode; ++ ++ LKTRTrace("%.*s, sgen %d\n", DLNPair(dentry), sgen); ++ DEBUG_ON(!dentry->d_inode); ++ DiMustWriteLock(dentry); ++ ++ if (!stosi(dentry->d_sb)->si_failed_refresh_dirs) ++ return simple_reval_dpath(dentry, sgen); ++ ++ /* slow loop, keep it simple and stupid */ ++ /* cf: cpup_dirs() */ ++ err = 0; ++ while (au_digen(dentry) != sgen) { ++ d = dentry; ++ while (1) { ++ parent = d->d_parent; // dget_parent() ++ if (au_digen(parent) == sgen) ++ break; ++ d = parent; ++ } ++ ++ inode = d->d_inode; ++ if (d != dentry) { ++ //i_lock(inode); ++ di_write_lock_child(d); ++ } ++ ++ /* someone might update our dentry while we were sleeping */ ++ if (au_digen(d) != sgen) { ++ di_read_lock_parent(parent, AUFS_I_RLOCK); ++ /* returns a number of positive dentries */ ++ err = au_refresh_hdentry(d, inode->i_mode & S_IFMT); ++ //err = -1; ++ if (err >= 0) ++ err = au_refresh_hinode(inode, d); ++ //err = -1; ++ di_read_unlock(parent, AUFS_I_RLOCK); ++ } ++ ++ if (d != dentry) { ++ di_write_unlock(d); ++ //i_unlock(inode); ++ } ++ if (unlikely(err)) ++ break; ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * THIS IS A BOOLEAN FUNCTION: returns 1 if valid, 0 otherwise. ++ * nfsd passes NULL as nameidata. ++ */ ++static int aufs_d_revalidate(struct dentry *dentry, struct nameidata *nd) ++{ ++ int valid, sgen, err, do_udba; ++ struct super_block *sb; ++ struct inode *inode; ++ ++ LKTRTrace("dentry %.*s\n", DLNPair(dentry)); ++ if (nd && nd->dentry) ++ LKTRTrace("nd %.*s\n", DLNPair(nd->dentry)); ++ //dir case: DEBUG_ON(dentry->d_parent != nd->dentry); ++ //remove failure case: DEBUG_ON(!IS_ROOT(dentry) && d_unhashed(dentry)); ++ DEBUG_ON(!dentry->d_fsdata); ++ //DbgDentry(dentry); ++ ++ err = -EINVAL; ++ inode = dentry->d_inode; ++ //DbgInode(inode); ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ sgen = au_sigen(sb); ++ if (au_digen(dentry) == sgen) ++ di_read_lock_child(dentry, !AUFS_I_RLOCK); ++ else { ++ DEBUG_ON(IS_ROOT(dentry)); ++#ifdef ForceInotify ++ Dbg("UDBA or digen, %.*s\n", DLNPair(dentry)); ++#endif ++ //i_lock(inode); ++ di_write_lock_child(dentry); ++ if (inode) ++ err = au_reval_dpath(dentry, sgen); ++ //err = -1; ++ di_downgrade_lock(dentry, AUFS_I_RLOCK); ++ //i_unlock(inode); ++ if (unlikely(err)) ++ goto out; ++ ii_read_unlock(inode); ++ DEBUG_ON(au_iigen(inode) != sgen); ++ } ++ ++ if (inode) { ++ if (au_iigen(inode) == sgen) ++ ii_read_lock_child(inode); ++ else { ++ DEBUG_ON(IS_ROOT(dentry)); ++#ifdef ForceInotify ++ Dbg("UDBA or survived, %.*s\n", DLNPair(dentry)); ++#endif ++ ii_write_lock_child(inode); ++ err = au_refresh_hinode(inode, dentry); ++ ii_downgrade_lock(inode); ++ if (unlikely(err)) ++ goto out; ++ DEBUG_ON(au_iigen(inode) != sgen); ++ } ++ } ++ ++#if 0 // fix it ++ /* parent dir i_nlink is not updated in the case of setattr */ ++ if (S_ISDIR(inode->i_mode)) { ++ i_lock(inode); ++ ii_write_lock(inode); ++ au_cpup_attr_nlink(inode); ++ ii_write_unlock(inode); ++ i_unlock(inode); ++ } ++#endif ++ ++ err = -EINVAL; ++ do_udba = !au_flag_test(sb, AuFlag_UDBA_NONE); ++ if (do_udba && inode && ibstart(inode) >= 0 ++ && au_test_higen(inode, au_h_iptr(inode))) ++ goto out; ++ err = h_d_revalidate(dentry, nd, do_udba); ++ //err = -1; ++ ++ out: ++ aufs_read_unlock(dentry, AUFS_I_RLOCK); ++ TraceErr(err); ++ valid = !err; ++ //au_debug_on(); ++ if (!valid) ++ LKTRTrace("%.*s invalid\n", DLNPair(dentry)); ++ //au_debug_off(); ++ return valid; ++} ++ ++static void aufs_d_release(struct dentry *dentry) ++{ ++ struct aufs_dinfo *dinfo; ++ aufs_bindex_t bend, bindex; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ DEBUG_ON(!d_unhashed(dentry)); ++ ++ dinfo = dentry->d_fsdata; ++ if (unlikely(!dinfo)) ++ return; ++ ++ /* dentry may not be revalidated */ ++ bindex = dinfo->di_bstart; ++ if (bindex >= 0) { ++ struct aufs_hdentry *p; ++ bend = dinfo->di_bend; ++ DEBUG_ON(bend < bindex); ++ p = dinfo->di_hdentry + bindex; ++ while (bindex++ <= bend) { ++ if (p->hd_dentry) ++ hdput(p); ++ p++; ++ } ++ } ++ kfree(dinfo->di_hdentry); ++ cache_free_dinfo(dinfo); ++} ++ ++#if 0 ++/* it may be called at remount time, too */ ++static void aufs_d_iput(struct dentry *dentry, struct inode *inode) ++{ ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s, i%lu\n", DLNPair(dentry), inode->i_ino); ++ ++ sb = dentry->d_sb; ++#if 0 ++ si_read_lock(sb); ++ if (unlikely(au_flag_test(sb, AuFlag_PLINK) ++ && au_is_plinked(sb, inode))) { ++ ii_write_lock(inode); ++ au_update_brange(inode, 1); ++ ii_write_unlock(inode); ++ } ++ si_read_unlock(sb); ++#endif ++ iput(inode); ++} ++#endif ++ ++struct dentry_operations aufs_dop = { ++ .d_revalidate = aufs_d_revalidate, ++ .d_release = aufs_d_release ++ //.d_iput = aufs_d_iput ++}; +diff --git a/fs/aufs/dentry.h b/fs/aufs/dentry.h +new file mode 100755 +index 0000000..78049e3 +--- /dev/null ++++ b/fs/aufs/dentry.h +@@ -0,0 +1,183 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: dentry.h,v 1.25 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_DENTRY_H__ ++#define __AUFS_DENTRY_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/aufs_type.h> ++#include "misc.h" ++ ++struct aufs_hdentry { ++ struct dentry *hd_dentry; ++}; ++ ++struct aufs_dinfo { ++ atomic_t di_generation; ++ ++ struct aufs_rwsem di_rwsem; ++ aufs_bindex_t di_bstart, di_bend, di_bwh, di_bdiropq; ++ struct aufs_hdentry *di_hdentry; ++}; ++ ++struct lkup_args { ++ struct vfsmount *nfsmnt; ++ int dlgt; ++ //struct super_block *sb; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* dentry.c */ ++#if defined(CONFIG_AUFS_LHASH_PATCH) || defined(CONFIG_AUFS_DLGT) ++struct dentry *lkup_one(const char *name, struct dentry *parent, int len, ++ struct lkup_args *lkup); ++#else ++static inline ++struct dentry *lkup_one(const char *name, struct dentry *parent, int len, ++ struct lkup_args *lkup) ++{ ++ return lookup_one_len(name, parent, len); ++} ++#endif ++ ++extern struct dentry_operations aufs_dop; ++struct dentry *sio_lkup_one(const char *name, struct dentry *parent, int len, ++ struct lkup_args *lkup); ++int lkup_dentry(struct dentry *dentry, aufs_bindex_t bstart, mode_t type); ++int lkup_neg(struct dentry *dentry, aufs_bindex_t bindex); ++int au_refresh_hdentry(struct dentry *dentry, mode_t type); ++int au_reval_dpath(struct dentry *dentry, int sgen); ++ ++/* dinfo.c */ ++int au_alloc_dinfo(struct dentry *dentry); ++struct aufs_dinfo *dtodi(struct dentry *dentry); ++ ++void di_read_lock(struct dentry *d, int flags, unsigned int lsc); ++void di_read_unlock(struct dentry *d, int flags); ++void di_downgrade_lock(struct dentry *d, int flags); ++void di_write_lock(struct dentry *d, unsigned int lsc); ++void di_write_unlock(struct dentry *d); ++void di_write_lock2_child(struct dentry *d1, struct dentry *d2, int isdir); ++void di_write_lock2_parent(struct dentry *d1, struct dentry *d2, int isdir); ++void di_write_unlock2(struct dentry *d1, struct dentry *d2); ++ ++aufs_bindex_t dbstart(struct dentry *dentry); ++aufs_bindex_t dbend(struct dentry *dentry); ++aufs_bindex_t dbwh(struct dentry *dentry); ++aufs_bindex_t dbdiropq(struct dentry *dentry); ++struct dentry *au_h_dptr_i(struct dentry *dentry, aufs_bindex_t bindex); ++struct dentry *au_h_dptr(struct dentry *dentry); ++ ++aufs_bindex_t dbtail(struct dentry *dentry); ++aufs_bindex_t dbtaildir(struct dentry *dentry); ++aufs_bindex_t dbtail_generic(struct dentry *dentry); ++ ++void set_dbstart(struct dentry *dentry, aufs_bindex_t bindex); ++void set_dbend(struct dentry *dentry, aufs_bindex_t bindex); ++void set_dbwh(struct dentry *dentry, aufs_bindex_t bindex); ++void set_dbdiropq(struct dentry *dentry, aufs_bindex_t bindex); ++void hdput(struct aufs_hdentry *hdentry); ++void set_h_dptr(struct dentry *dentry, aufs_bindex_t bindex, ++ struct dentry *h_dentry); ++ ++void au_update_digen(struct dentry *dentry); ++void au_update_dbstart(struct dentry *dentry); ++int au_find_dbindex(struct dentry *dentry, struct dentry *h_dentry); ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline int au_digen(struct dentry *d) ++{ ++ return atomic_read(&dtodi(d)->di_generation); ++} ++ ++#ifdef CONFIG_AUFS_HINOTIFY ++static inline void au_digen_dec(struct dentry *d) ++{ ++ atomic_dec(&dtodi(d)->di_generation); ++} ++#endif /* CONFIG_AUFS_HINOTIFY */ ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* lock subclass for dinfo */ ++enum { ++ AuLsc_DI_CHILD, /* child first */ ++ AuLsc_DI_CHILD2, /* rename(2), link(2), and cpup at hinotify */ ++ AuLsc_DI_CHILD3, /* copyup dirs */ ++ AuLsc_DI_PARENT, ++ AuLsc_DI_PARENT2, ++ AuLsc_DI_PARENT3 ++}; ++ ++/* ++ * di_read_lock_child, di_write_lock_child, ++ * di_read_lock_child2, di_write_lock_child2, ++ * di_read_lock_child3, di_write_lock_child3, ++ * di_read_lock_parent, di_write_lock_parent, ++ * di_read_lock_parent2, di_write_lock_parent2, ++ * di_read_lock_parent3, di_write_lock_parent3, ++ */ ++#define ReadLockFunc(name, lsc) \ ++static inline void di_read_lock_##name(struct dentry *d, int flags) \ ++{di_read_lock(d, flags, AuLsc_DI_##lsc);} ++ ++#define WriteLockFunc(name, lsc) \ ++static inline void di_write_lock_##name(struct dentry *d) \ ++{di_write_lock(d, AuLsc_DI_##lsc);} ++ ++#define RWLockFuncs(name, lsc) \ ++ ReadLockFunc(name, lsc); \ ++ WriteLockFunc(name, lsc) ++ ++RWLockFuncs(child, CHILD); ++RWLockFuncs(child2, CHILD2); ++RWLockFuncs(child3, CHILD3); ++RWLockFuncs(parent, PARENT); ++RWLockFuncs(parent2, PARENT2); ++RWLockFuncs(parent3, PARENT3); ++ ++#undef ReadLockFunc ++#undef WriteLockFunc ++#undef RWLockFunc ++ ++/* to debug easier, do not make them inlined functions */ ++#define DiMustReadLock(d) do { \ ++ SiMustAnyLock((d)->d_sb); \ ++ RwMustReadLock(&dtodi(d)->di_rwsem); \ ++} while (0) ++ ++#define DiMustWriteLock(d) do { \ ++ SiMustAnyLock((d)->d_sb); \ ++ RwMustWriteLock(&dtodi(d)->di_rwsem); \ ++} while (0) ++ ++#define DiMustAnyLock(d) do { \ ++ SiMustAnyLock((d)->d_sb); \ ++ RwMustAnyLock(&dtodi(d)->di_rwsem); \ ++} while (0) ++ ++#define DiMustNoWaiters(d) RwMustNoWaiters(&dtodi(d)->di_rwsem) ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_DENTRY_H__ */ +diff --git a/fs/aufs/dinfo.c b/fs/aufs/dinfo.c +new file mode 100755 +index 0000000..6082149 +--- /dev/null ++++ b/fs/aufs/dinfo.c +@@ -0,0 +1,419 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: dinfo.c,v 1.23 2007/05/07 03:43:36 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++int au_alloc_dinfo(struct dentry *dentry) ++{ ++ struct aufs_dinfo *dinfo; ++ struct super_block *sb; ++ int nbr; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ DEBUG_ON(dentry->d_fsdata); ++ ++ dinfo = cache_alloc_dinfo(); ++ //if (LktrCond) {cache_free_dinfo(dinfo); dinfo = NULL;} ++ if (dinfo) { ++ sb = dentry->d_sb; ++ nbr = sbend(sb) + 1; ++ if (unlikely(!nbr)) ++ nbr++; ++ dinfo->di_hdentry = kcalloc(nbr, sizeof(*dinfo->di_hdentry), ++ GFP_KERNEL); ++ //if (LktrCond) ++ //{kfree(dinfo->di_hdentry); dinfo->di_hdentry = NULL;} ++ if (dinfo->di_hdentry) { ++ rw_init_wlock_nested(&dinfo->di_rwsem, AuLsc_DI_PARENT); ++ dinfo->di_bstart = dinfo->di_bend = -1; ++ dinfo->di_bwh = dinfo->di_bdiropq = -1; ++ atomic_set(&dinfo->di_generation, au_sigen(sb)); ++ ++ dentry->d_fsdata = dinfo; ++ dentry->d_op = &aufs_dop; ++ return 0; /* success */ ++ } ++ cache_free_dinfo(dinfo); ++ } ++ TraceErr(-ENOMEM); ++ return -ENOMEM; ++} ++ ++struct aufs_dinfo *dtodi(struct dentry *dentry) ++{ ++ struct aufs_dinfo *dinfo = dentry->d_fsdata; ++ DEBUG_ON(!dinfo ++ || !dinfo->di_hdentry ++ /* || stosi(dentry->d_sb)->si_bend < dinfo->di_bend */ ++ || dinfo->di_bend < dinfo->di_bstart ++ /* dbwh can be outside of this range */ ++ || (0 <= dinfo->di_bdiropq ++ && (dinfo->di_bdiropq < dinfo->di_bstart ++ /* || dinfo->di_bend < dinfo->di_bdiropq */)) ++ ); ++ return dinfo; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static void do_ii_write_lock(struct inode *inode, unsigned int lsc) ++{ ++ switch (lsc) { ++ case AuLsc_DI_CHILD: ++ ii_write_lock_child(inode); ++ break; ++ case AuLsc_DI_CHILD2: ++ ii_write_lock_child2(inode); ++ break; ++ case AuLsc_DI_CHILD3: ++ ii_write_lock_child3(inode); ++ break; ++ case AuLsc_DI_PARENT: ++ ii_write_lock_parent(inode); ++ break; ++ case AuLsc_DI_PARENT2: ++ ii_write_lock_parent2(inode); ++ break; ++ case AuLsc_DI_PARENT3: ++ ii_write_lock_parent3(inode); ++ break; ++ default: ++ BUG(); ++ } ++} ++ ++static void do_ii_read_lock(struct inode *inode, unsigned int lsc) ++{ ++ switch (lsc) { ++ case AuLsc_DI_CHILD: ++ ii_read_lock_child(inode); ++ break; ++ case AuLsc_DI_CHILD2: ++ ii_read_lock_child2(inode); ++ break; ++ case AuLsc_DI_CHILD3: ++ ii_read_lock_child3(inode); ++ break; ++ case AuLsc_DI_PARENT: ++ ii_read_lock_parent(inode); ++ break; ++ case AuLsc_DI_PARENT2: ++ ii_read_lock_parent2(inode); ++ break; ++ case AuLsc_DI_PARENT3: ++ ii_read_lock_parent3(inode); ++ break; ++ default: ++ BUG(); ++ } ++} ++ ++void di_read_lock(struct dentry *d, int flags, unsigned int lsc) ++{ ++ SiMustAnyLock(d->d_sb); ++ // todo: always nested? ++ rw_read_lock_nested(&dtodi(d)->di_rwsem, lsc); ++ if (d->d_inode) { ++ if (flags & AUFS_I_WLOCK) ++ do_ii_write_lock(d->d_inode, lsc); ++ else if (flags & AUFS_I_RLOCK) ++ do_ii_read_lock(d->d_inode, lsc); ++ } ++} ++ ++void di_read_unlock(struct dentry *d, int flags) ++{ ++ SiMustAnyLock(d->d_sb); ++ if (d->d_inode) { ++ if (flags & AUFS_I_WLOCK) ++ ii_write_unlock(d->d_inode); ++ else if (flags & AUFS_I_RLOCK) ++ ii_read_unlock(d->d_inode); ++ } ++ rw_read_unlock(&dtodi(d)->di_rwsem); ++} ++ ++void di_downgrade_lock(struct dentry *d, int flags) ++{ ++ SiMustAnyLock(d->d_sb); ++ rw_dgrade_lock(&dtodi(d)->di_rwsem); ++ if (d->d_inode && (flags & AUFS_I_RLOCK)) ++ ii_downgrade_lock(d->d_inode); ++} ++ ++void di_write_lock(struct dentry *d, unsigned int lsc) ++{ ++ SiMustAnyLock(d->d_sb); ++ // todo: always nested? ++ rw_write_lock_nested(&dtodi(d)->di_rwsem, lsc); ++ if (d->d_inode) ++ do_ii_write_lock(d->d_inode, lsc); ++} ++ ++void di_write_unlock(struct dentry *d) ++{ ++ SiMustAnyLock(d->d_sb); ++ if (d->d_inode) ++ ii_write_unlock(d->d_inode); ++ rw_write_unlock(&dtodi(d)->di_rwsem); ++} ++ ++void di_write_lock2_child(struct dentry *d1, struct dentry *d2, int isdir) ++{ ++ struct dentry *d; ++ ++ TraceEnter(); ++ DEBUG_ON(d1 == d2 ++ || d1->d_inode == d2->d_inode ++ || d1->d_sb != d2->d_sb); ++ ++ if (isdir) ++ for (d = d1; d->d_parent != d; d = d->d_parent) // dget_parent() ++ if (d->d_parent == d2) { ++ di_write_lock_child(d1); ++ di_write_lock_child2(d2); ++ return; ++ } ++ ++ di_write_lock_child(d2); ++ di_write_lock_child2(d1); ++} ++ ++void di_write_lock2_parent(struct dentry *d1, struct dentry *d2, int isdir) ++{ ++ struct dentry *d; ++ ++ TraceEnter(); ++ DEBUG_ON(d1 == d2 ++ || d1->d_inode == d2->d_inode ++ || d1->d_sb != d2->d_sb); ++ ++ if (isdir) ++ for (d = d1; d->d_parent != d; d = d->d_parent) // dget_parent() ++ if (d->d_parent == d2) { ++ di_write_lock_parent(d1); ++ di_write_lock_parent2(d2); ++ return; ++ } ++ ++ di_write_lock_parent(d2); ++ di_write_lock_parent2(d1); ++} ++ ++void di_write_unlock2(struct dentry *d1, struct dentry *d2) ++{ ++ di_write_unlock(d1); ++ if (d1->d_inode == d2->d_inode) ++ rw_write_unlock(&dtodi(d2)->di_rwsem); ++ else ++ di_write_unlock(d2); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++aufs_bindex_t dbstart(struct dentry *dentry) ++{ ++ DiMustAnyLock(dentry); ++ return dtodi(dentry)->di_bstart; ++} ++ ++aufs_bindex_t dbend(struct dentry *dentry) ++{ ++ DiMustAnyLock(dentry); ++ return dtodi(dentry)->di_bend; ++} ++ ++aufs_bindex_t dbwh(struct dentry *dentry) ++{ ++ DiMustAnyLock(dentry); ++ return dtodi(dentry)->di_bwh; ++} ++ ++aufs_bindex_t dbdiropq(struct dentry *dentry) ++{ ++ DiMustAnyLock(dentry); ++ DEBUG_ON(dentry->d_inode ++ && dentry->d_inode->i_mode ++ && !S_ISDIR(dentry->d_inode->i_mode)); ++ return dtodi(dentry)->di_bdiropq; ++} ++ ++struct dentry *au_h_dptr_i(struct dentry *dentry, aufs_bindex_t bindex) ++{ ++ struct dentry *d; ++ ++ DiMustAnyLock(dentry); ++ if (dbstart(dentry) < 0 || bindex < dbstart(dentry)) ++ return NULL; ++ DEBUG_ON(bindex < 0 ++ /* || bindex > sbend(dentry->d_sb) */); ++ d = dtodi(dentry)->di_hdentry[0 + bindex].hd_dentry; ++ DEBUG_ON(d && (atomic_read(&d->d_count) <= 0)); ++ return d; ++} ++ ++struct dentry *au_h_dptr(struct dentry *dentry) ++{ ++ return au_h_dptr_i(dentry, dbstart(dentry)); ++} ++ ++aufs_bindex_t dbtail(struct dentry *dentry) ++{ ++ aufs_bindex_t bend, bwh; ++ ++ bend = dbend(dentry); ++ if (0 <= bend) { ++ bwh = dbwh(dentry); ++ //DEBUG_ON(bend < bwh); ++ if (!bwh) ++ return bwh; ++ if (0 < bwh && bwh < bend) ++ return bwh - 1; ++ } ++ return bend; ++} ++ ++aufs_bindex_t dbtaildir(struct dentry *dentry) ++{ ++ aufs_bindex_t bend, bopq; ++ ++ DEBUG_ON(dentry->d_inode ++ && dentry->d_inode->i_mode ++ && !S_ISDIR(dentry->d_inode->i_mode)); ++ ++ bend = dbtail(dentry); ++ if (0 <= bend) { ++ bopq = dbdiropq(dentry); ++ DEBUG_ON(bend < bopq); ++ if (0 <= bopq && bopq < bend) ++ bend = bopq; ++ } ++ return bend; ++} ++ ++aufs_bindex_t dbtail_generic(struct dentry *dentry) ++{ ++ struct inode *inode; ++ ++ inode = dentry->d_inode; ++ if (inode && S_ISDIR(inode->i_mode)) ++ return dbtaildir(dentry); ++ else ++ return dbtail(dentry); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++// hard/soft set ++void set_dbstart(struct dentry *dentry, aufs_bindex_t bindex) ++{ ++ DiMustWriteLock(dentry); ++ DEBUG_ON(sbend(dentry->d_sb) < bindex); ++ /* */ ++ dtodi(dentry)->di_bstart = bindex; ++} ++ ++void set_dbend(struct dentry *dentry, aufs_bindex_t bindex) ++{ ++ DiMustWriteLock(dentry); ++ DEBUG_ON(sbend(dentry->d_sb) < bindex ++ || bindex < dbstart(dentry)); ++ dtodi(dentry)->di_bend = bindex; ++} ++ ++void set_dbwh(struct dentry *dentry, aufs_bindex_t bindex) ++{ ++ DiMustWriteLock(dentry); ++ DEBUG_ON(sbend(dentry->d_sb) < bindex); ++ /* dbwh can be outside of bstart - bend range */ ++ dtodi(dentry)->di_bwh = bindex; ++} ++ ++void set_dbdiropq(struct dentry *dentry, aufs_bindex_t bindex) ++{ ++ DiMustWriteLock(dentry); ++ DEBUG_ON(sbend(dentry->d_sb) < bindex); ++ DEBUG_ON((bindex != -1 ++ && (bindex < dbstart(dentry) || dbend(dentry) < bindex)) ++ || (dentry->d_inode ++ && dentry->d_inode->i_mode ++ && !S_ISDIR(dentry->d_inode->i_mode))); ++ dtodi(dentry)->di_bdiropq = bindex; ++} ++ ++void hdput(struct aufs_hdentry *hd) ++{ ++ dput(hd->hd_dentry); ++} ++ ++void set_h_dptr(struct dentry *dentry, aufs_bindex_t bindex, ++ struct dentry *h_dentry) ++{ ++ struct aufs_hdentry *hd = dtodi(dentry)->di_hdentry + bindex; ++ DiMustWriteLock(dentry); ++ DEBUG_ON(bindex < dtodi(dentry)->di_bstart ++ || bindex > dtodi(dentry)->di_bend ++ || (h_dentry && atomic_read(&h_dentry->d_count) <= 0) ++ || (h_dentry && hd->hd_dentry) ++ ); ++ if (hd->hd_dentry) ++ hdput(hd); ++ hd->hd_dentry = h_dentry; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++void au_update_digen(struct dentry *dentry) ++{ ++ //DiMustWriteLock(dentry); ++ DEBUG_ON(!dentry->d_sb); ++ atomic_set(&dtodi(dentry)->di_generation, au_sigen(dentry->d_sb)); ++} ++ ++void au_update_dbstart(struct dentry *dentry) ++{ ++ aufs_bindex_t bindex, bstart = dbstart(dentry), bend = dbend(dentry); ++ struct dentry *hidden_dentry; ++ ++ DiMustWriteLock(dentry); ++ for (bindex = bstart; bindex <= bend; bindex++) { ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (!hidden_dentry) ++ continue; ++ if (hidden_dentry->d_inode) { ++ set_dbstart(dentry, bindex); ++ return; ++ } ++ set_h_dptr(dentry, bindex, NULL); ++ } ++ //set_dbstart(dentry, -1); ++ //set_dbend(dentry, -1); ++} ++ ++int au_find_dbindex(struct dentry *dentry, struct dentry *hidden_dentry) ++{ ++ aufs_bindex_t bindex, bend; ++ ++ bend = dbend(dentry); ++ for (bindex = dbstart(dentry); bindex <= bend; bindex++) ++ if (au_h_dptr_i(dentry, bindex) == hidden_dentry) ++ return bindex; ++ return -1; ++} +diff --git a/fs/aufs/dir.c b/fs/aufs/dir.c +new file mode 100755 +index 0000000..9afb1a9 +--- /dev/null ++++ b/fs/aufs/dir.c +@@ -0,0 +1,564 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: dir.c,v 1.36 2007/05/14 03:38:52 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++static int reopen_dir(struct file *file) ++{ ++ int err; ++ struct dentry *dentry, *hidden_dentry; ++ aufs_bindex_t bindex, btail, bstart; ++ struct file *hidden_file; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ DEBUG_ON(!S_ISDIR(dentry->d_inode->i_mode)); ++ ++ /* open all hidden dirs */ ++ bstart = dbstart(dentry); ++#if 1 ++ for (bindex = fbstart(file); bindex < bstart; bindex++) ++ set_h_fptr(file, bindex, NULL); ++#endif ++ set_fbstart(file, bstart); ++ btail = dbtaildir(dentry); ++#if 1 ++ for (bindex = fbend(file); btail < bindex; bindex--) ++ set_h_fptr(file, bindex, NULL); ++#endif ++ set_fbend(file, btail); ++ for (bindex = bstart; bindex <= btail; bindex++) { ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (!hidden_dentry) ++ continue; ++ hidden_file = au_h_fptr_i(file, bindex); ++ if (hidden_file) { ++ DEBUG_ON(hidden_file->f_dentry != hidden_dentry); ++ continue; ++ } ++ ++ hidden_file = hidden_open(dentry, bindex, file->f_flags); ++ // unavailable ++ //if (LktrCond) {fput(hidden_file); ++ //br_put(stobr(dentry->d_sb, bindex));hidden_file=ERR_PTR(-1);} ++ err = PTR_ERR(hidden_file); ++ if (IS_ERR(hidden_file)) ++ goto out; // close all? ++ //cpup_file_flags(hidden_file, file); ++ set_h_fptr(file, bindex, hidden_file); ++ } ++ err = 0; ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static int do_open_dir(struct file *file, int flags) ++{ ++ int err; ++ aufs_bindex_t bindex, btail; ++ struct dentry *dentry, *hidden_dentry; ++ struct file *hidden_file; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, 0x%x\n", DLNPair(dentry), flags); ++ DEBUG_ON(!dentry->d_inode || !S_ISDIR(dentry->d_inode->i_mode)); ++ ++ err = 0; ++ set_fvdir_cache(file, NULL); ++ file->f_version = dentry->d_inode->i_version; ++ bindex = dbstart(dentry); ++ set_fbstart(file, bindex); ++ btail = dbtaildir(dentry); ++ set_fbend(file, btail); ++ for (; !err && bindex <= btail; bindex++) { ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (!hidden_dentry) ++ continue; ++ ++ hidden_file = hidden_open(dentry, bindex, flags); ++ //if (LktrCond) {fput(hidden_file); ++ //br_put(stobr(dentry->d_sb, bindex));hidden_file=ERR_PTR(-1);} ++ if (!IS_ERR(hidden_file)) { ++ set_h_fptr(file, bindex, hidden_file); ++ continue; ++ } ++ err = PTR_ERR(hidden_file); ++ } ++ if (!err) ++ return 0; /* success */ ++ ++ /* close all */ ++ for (bindex = fbstart(file); !err && bindex <= btail; bindex++) ++ set_h_fptr(file, bindex, NULL); ++ set_fbstart(file, -1); ++ set_fbend(file, -1); ++ return err; ++} ++ ++static int aufs_open_dir(struct inode *inode, struct file *file) ++{ ++ return au_do_open(inode, file, do_open_dir); ++} ++ ++static int aufs_release_dir(struct inode *inode, struct file *file) ++{ ++ struct aufs_vdir *vdir_cache; ++ struct super_block *sb; ++ ++ LKTRTrace("i%lu, %.*s\n", inode->i_ino, DLNPair(file->f_dentry)); ++ ++ sb = file->f_dentry->d_sb; ++ si_read_lock(sb); ++ fi_write_lock(file); ++ vdir_cache = fvdir_cache(file); ++ if (vdir_cache) ++ free_vdir(vdir_cache); ++ fi_write_unlock(file); ++ au_fin_finfo(file); ++ si_read_unlock(sb); ++ return 0; ++} ++ ++static int fsync_dir(struct dentry *dentry, int datasync) ++{ ++ int err; ++ struct inode *inode; ++ struct super_block *sb; ++ aufs_bindex_t bend, bindex; ++ ++ LKTRTrace("%.*s, %d\n", DLNPair(dentry), datasync); ++ DiMustAnyLock(dentry); ++ sb = dentry->d_sb; ++ SiMustAnyLock(sb); ++ inode = dentry->d_inode; ++ IMustLock(inode); ++ IiMustAnyLock(inode); ++ ++ err = 0; ++ bend = dbend(dentry); ++ for (bindex = dbstart(dentry); !err && bindex <= bend; bindex++) { ++ struct dentry *h_dentry; ++ struct inode *h_inode; ++ struct file_operations *fop; ++ ++ if (test_ro(sb, bindex, inode)) ++ continue; ++ h_dentry = au_h_dptr_i(dentry, bindex); ++ if (!h_dentry) ++ continue; ++ h_inode = h_dentry->d_inode; ++ if (!h_inode) ++ continue; ++ ++ /* cf. fs/nsfd/vfs.c and fs/nfsd/nfs4recover.c */ ++ //hdir_lock(h_inode, inode, bindex); ++ i_lock(h_inode); ++ fop = (void*)h_inode->i_fop; ++ err = filemap_fdatawrite(h_inode->i_mapping); ++ if (!err && fop && fop->fsync) ++ err = fop->fsync(NULL, h_dentry, datasync); ++ if (!err) ++ err = filemap_fdatawrite(h_inode->i_mapping); ++ //hdir_unlock(h_inode, inode, bindex); ++ i_unlock(h_inode); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * @file may be NULL ++ */ ++static int aufs_fsync_dir(struct file *file, struct dentry *dentry, ++ int datasync) ++{ ++ int err; ++ struct inode *inode; ++ struct file *hidden_file; ++ struct super_block *sb; ++ aufs_bindex_t bend, bindex; ++ ++ LKTRTrace("%.*s, %d\n", DLNPair(dentry), datasync); ++ inode = dentry->d_inode; ++ IMustLock(inode); ++ ++ err = 0; ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ if (file) { ++ err = au_reval_and_lock_finfo(file, reopen_dir, /*wlock*/1, ++ /*locked*/1); ++ //err = -1; ++ if (unlikely(err)) ++ goto out; ++ } else ++ di_read_lock_child(dentry, !AUFS_I_WLOCK); ++ ++ ii_write_lock_child(inode); ++ if (file) { ++ bend = fbend(file); ++ for (bindex = fbstart(file); !err && bindex <= bend; bindex++) { ++ hidden_file = au_h_fptr_i(file, bindex); ++ if (!hidden_file || test_ro(sb, bindex, inode)) ++ continue; ++ ++ err = -EINVAL; ++ if (hidden_file->f_op && hidden_file->f_op->fsync) { ++ // todo: try do_fsync() in fs/sync.c ++#if 0 ++ DEBUG_ON(hidden_file->f_dentry->d_inode ++ != au_h_iptr_i(inode, bindex)); ++ hdir_lock(hidden_file->f_dentry->d_inode, inode, ++ bindex); ++#else ++ i_lock(hidden_file->f_dentry->d_inode); ++#endif ++ err = hidden_file->f_op->fsync ++ (hidden_file, hidden_file->f_dentry, ++ datasync); ++ //err = -1; ++#if 0 ++ hdir_unlock(hidden_file->f_dentry->d_inode, ++ inode, bindex); ++#else ++ i_unlock(hidden_file->f_dentry->d_inode); ++#endif ++ } ++ } ++ } else ++ err = fsync_dir(dentry, datasync); ++ au_cpup_attr_timesizes(inode); ++ ii_write_unlock(inode); ++ if (file) ++ fi_write_unlock(file); ++ else ++ di_read_unlock(dentry, !AUFS_I_WLOCK); ++ ++ out: ++ si_read_unlock(sb); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int aufs_readdir(struct file *file, void *dirent, filldir_t filldir) ++{ ++ int err; ++ struct dentry *dentry; ++ struct inode *inode; ++ struct super_block *sb; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, pos %Ld\n", DLNPair(dentry), file->f_pos); ++ inode = dentry->d_inode; ++ IMustLock(inode); ++ ++ au_nfsd_lockdep_off(); ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = au_reval_and_lock_finfo(file, reopen_dir, /*wlock*/1, ++ /*locked*/1); ++ if (unlikely(err)) ++ goto out; ++ ++ ii_write_lock_child(inode); ++ err = au_init_vdir(file); ++ if (unlikely(err)) { ++ ii_write_unlock(inode); ++ goto out_unlock; ++ } ++ //DbgVdir(fvdir_cache(file));// goto out_unlock; ++ ++ /* nfsd filldir calls lookup_one_len(). */ ++ ii_downgrade_lock(inode); ++ err = au_fill_de(file, dirent, filldir); ++ //DbgVdir(fvdir_cache(file));// goto out_unlock; ++ ++ inode->i_atime = au_h_iptr(inode)->i_atime; ++ ii_read_unlock(inode); ++ ++ out_unlock: ++ fi_write_unlock(file); ++ out: ++ si_read_unlock(sb); ++ au_nfsd_lockdep_on(); ++#if 0 // debug ++ if (LktrCond) ++ igrab(inode); ++#endif ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct test_empty_arg { ++ struct aufs_nhash *whlist; ++ int whonly; ++ aufs_bindex_t bindex; ++ int err, called; ++}; ++ ++static int test_empty_cb(void *__arg, const char *__name, int namelen, ++ loff_t offset, filldir_ino_t ino, unsigned int d_type) ++{ ++ struct test_empty_arg *arg = __arg; ++ char *name = (void*)__name; ++ ++ LKTRTrace("%.*s\n", namelen, name); ++ ++ arg->err = 0; ++ arg->called++; ++ //smp_mb(); ++ if (name[0] == '.' ++ && (namelen == 1 || (name[1] == '.' && namelen == 2))) ++ return 0; /* success */ ++ ++ if (namelen <= AUFS_WH_PFX_LEN ++ || memcmp(name, AUFS_WH_PFX, AUFS_WH_PFX_LEN)) { ++ if (arg->whonly && !test_known_wh(arg->whlist, name, namelen)) ++ arg->err = -ENOTEMPTY; ++ goto out; ++ } ++ ++ name += AUFS_WH_PFX_LEN; ++ namelen -= AUFS_WH_PFX_LEN; ++ if (!test_known_wh(arg->whlist, name, namelen)) ++ arg->err = append_wh(arg->whlist, name, namelen, arg->bindex); ++ ++ out: ++ //smp_mb(); ++ TraceErr(arg->err); ++ return arg->err; ++} ++ ++static int do_test_empty(struct dentry *dentry, struct test_empty_arg *arg) ++{ ++ int err, dlgt; ++ struct file *hidden_file; ++ ++ LKTRTrace("%.*s, {%p, %d, %d}\n", ++ DLNPair(dentry), arg->whlist, arg->whonly, arg->bindex); ++ ++ hidden_file = hidden_open(dentry, arg->bindex, ++ O_RDONLY | O_NONBLOCK | O_DIRECTORY ++ | O_LARGEFILE); ++ err = PTR_ERR(hidden_file); ++ if (IS_ERR(hidden_file)) ++ goto out; ++ ++ dlgt = need_dlgt(dentry->d_sb); ++ //hidden_file->f_pos = 0; ++ do { ++ arg->err = 0; ++ arg->called = 0; ++ //smp_mb(); ++ err = vfsub_readdir(hidden_file, test_empty_cb, arg, dlgt); ++ if (err >= 0) ++ err = arg->err; ++ } while (!err && arg->called); ++ fput(hidden_file); ++ sbr_put(dentry->d_sb, arg->bindex); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++struct do_test_empty_args { ++ int *errp; ++ struct dentry *dentry; ++ struct test_empty_arg *arg; ++}; ++ ++static void call_do_test_empty(void *args) ++{ ++ struct do_test_empty_args *a = args; ++ *a->errp = do_test_empty(a->dentry, a->arg); ++} ++ ++static int sio_test_empty(struct dentry *dentry, struct test_empty_arg *arg) ++{ ++ int err; ++ struct dentry *hidden_dentry; ++ struct inode *hidden_inode; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ hidden_dentry = au_h_dptr_i(dentry, arg->bindex); ++ DEBUG_ON(!hidden_dentry); ++ hidden_inode = hidden_dentry->d_inode; ++ DEBUG_ON(!hidden_inode || !S_ISDIR(hidden_inode->i_mode)); ++ ++ hi_lock_child(hidden_inode); ++ err = au_test_perm(hidden_inode, MAY_EXEC | MAY_READ, ++ need_dlgt(dentry->d_sb)); ++ i_unlock(hidden_inode); ++ if (!err) ++ err = do_test_empty(dentry, arg); ++ else { ++ struct do_test_empty_args args = { ++ .errp = &err, ++ .dentry = dentry, ++ .arg = arg ++ }; ++ au_wkq_wait(call_do_test_empty, &args, /*dlgt*/0); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++int au_test_empty_lower(struct dentry *dentry) ++{ ++ int err; ++ struct inode *inode; ++ struct test_empty_arg arg; ++ struct aufs_nhash *whlist; ++ aufs_bindex_t bindex, bstart, btail; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ inode = dentry->d_inode; ++ DEBUG_ON(!inode || !S_ISDIR(inode->i_mode)); ++ ++ whlist = nhash_new(GFP_KERNEL); ++ err = PTR_ERR(whlist); ++ if (IS_ERR(whlist)) ++ goto out; ++ ++ bstart = dbstart(dentry); ++ arg.whlist = whlist; ++ arg.whonly = 0; ++ arg.bindex = bstart; ++ err = do_test_empty(dentry, &arg); ++ if (unlikely(err)) ++ goto out_whlist; ++ ++ arg.whonly = 1; ++ btail = dbtaildir(dentry); ++ for (bindex = bstart + 1; !err && bindex <= btail; bindex++) { ++ struct dentry *hidden_dentry; ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (hidden_dentry && hidden_dentry->d_inode) { ++ DEBUG_ON(!S_ISDIR(hidden_dentry->d_inode->i_mode)); ++ arg.bindex = bindex; ++ err = do_test_empty(dentry, &arg); ++ } ++ } ++ ++ out_whlist: ++ nhash_del(whlist); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++int test_empty(struct dentry *dentry, struct aufs_nhash *whlist) ++{ ++ int err; ++ struct inode *inode; ++ struct test_empty_arg arg; ++ aufs_bindex_t bindex, btail; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ inode = dentry->d_inode; ++ DEBUG_ON(!inode || !S_ISDIR(inode->i_mode)); ++ ++ err = 0; ++ arg.whlist = whlist; ++ arg.whonly = 1; ++ btail = dbtaildir(dentry); ++ for (bindex = dbstart(dentry); !err && bindex <= btail; bindex++) { ++ struct dentry *hidden_dentry; ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (hidden_dentry && hidden_dentry->d_inode) { ++ DEBUG_ON(!S_ISDIR(hidden_dentry->d_inode->i_mode)); ++ arg.bindex = bindex; ++ err = sio_test_empty(dentry, &arg); ++ } ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++void au_add_nlink(struct inode *dir, struct inode *h_dir) ++{ ++ DEBUG_ON(!S_ISDIR(dir->i_mode) || !S_ISDIR(h_dir->i_mode)); ++ dir->i_nlink += h_dir->i_nlink - 2; ++ if (unlikely(h_dir->i_nlink < 2)) ++ dir->i_nlink += 2; ++} ++ ++void au_sub_nlink(struct inode *dir, struct inode *h_dir) ++{ ++ DEBUG_ON(!S_ISDIR(dir->i_mode) || !S_ISDIR(h_dir->i_mode)); ++ dir->i_nlink -= h_dir->i_nlink - 2; ++ if (unlikely(h_dir->i_nlink < 2)) ++ dir->i_nlink -= 2; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#if 0 // comment ++struct file_operations { ++ struct module *owner; ++ loff_t (*llseek) (struct file *, loff_t, int); ++ ssize_t (*read) (struct file *, char __user *, size_t, loff_t *); ++ ssize_t (*aio_read) (struct kiocb *, char __user *, size_t, loff_t); ++ ssize_t (*write) (struct file *, const char __user *, size_t, loff_t *); ++ ssize_t (*aio_write) (struct kiocb *, const char __user *, size_t, loff_t); ++ int (*readdir) (struct file *, void *, filldir_t); ++ unsigned int (*poll) (struct file *, struct poll_table_struct *); ++ int (*ioctl) (struct inode *, struct file *, unsigned int, unsigned long); ++ long (*unlocked_ioctl) (struct file *, unsigned int, unsigned long); ++ long (*compat_ioctl) (struct file *, unsigned int, unsigned long); ++ int (*mmap) (struct file *, struct vm_area_struct *); ++ int (*open) (struct inode *, struct file *); ++ int (*flush) (struct file *); ++ int (*release) (struct inode *, struct file *); ++ int (*fsync) (struct file *, struct dentry *, int datasync); ++ int (*aio_fsync) (struct kiocb *, int datasync); ++ int (*fasync) (int, struct file *, int); ++ int (*lock) (struct file *, int, struct file_lock *); ++ ssize_t (*readv) (struct file *, const struct iovec *, unsigned long, loff_t *); ++ ssize_t (*writev) (struct file *, const struct iovec *, unsigned long, loff_t *); ++ ssize_t (*sendfile) (struct file *, loff_t *, size_t, read_actor_t, void *); ++ ssize_t (*sendpage) (struct file *, struct page *, int, size_t, loff_t *, int); ++ unsigned long (*get_unmapped_area)(struct file *, unsigned long, unsigned long, unsigned long, unsigned long); ++ int (*check_flags)(int); ++ int (*dir_notify)(struct file *file, unsigned long arg); ++ int (*flock) (struct file *, int, struct file_lock *); ++}; ++#endif ++ ++struct file_operations aufs_dir_fop = { ++ .read = generic_read_dir, ++ .readdir = aufs_readdir, ++ .open = aufs_open_dir, ++ .release = aufs_release_dir, ++ .flush = aufs_flush, ++ .fsync = aufs_fsync_dir, ++}; +diff --git a/fs/aufs/dir.h b/fs/aufs/dir.h +new file mode 100755 +index 0000000..3ddf309 +--- /dev/null ++++ b/fs/aufs/dir.h +@@ -0,0 +1,125 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: dir.h,v 1.18 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_DIR_H__ ++#define __AUFS_DIR_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,19) ++#define filldir_ino_t u64 ++#else ++#define filldir_ino_t ino_t ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* need to be faster and smaller */ ++ ++#define AUFS_DEBLK_SIZE 512 // todo: changable ++#define AUFS_NHASH_SIZE 32 // todo: changable ++#if AUFS_DEBLK_SIZE < NAME_MAX || PAGE_SIZE < AUFS_DEBLK_SIZE ++#error invalid size AUFS_DEBLK_SIZE ++#endif ++ ++typedef char aufs_deblk_t[AUFS_DEBLK_SIZE]; ++ ++struct aufs_nhash { ++ struct hlist_head heads[AUFS_NHASH_SIZE]; ++}; ++ ++struct aufs_destr { ++ unsigned char len; ++ char name[0]; ++} __attribute__ ((packed)); ++ ++struct aufs_dehstr { ++ struct hlist_node hash; ++ struct aufs_destr *str; ++}; ++ ++struct aufs_de { ++ ino_t de_ino; ++ unsigned char de_type; ++ //caution: packed ++ struct aufs_destr de_str; ++} __attribute__ ((packed)); ++ ++struct aufs_wh { ++ struct hlist_node wh_hash; ++ aufs_bindex_t wh_bindex; ++ struct aufs_destr wh_str; ++} __attribute__ ((packed)); ++ ++union aufs_deblk_p { ++ unsigned char *p; ++ aufs_deblk_t *deblk; ++ struct aufs_de *de; ++}; ++ ++struct aufs_vdir { ++ aufs_deblk_t **vd_deblk; ++ int vd_nblk; ++ struct { ++ int i; ++ union aufs_deblk_p p; ++ } vd_last; ++ ++ unsigned long vd_version; ++ unsigned long vd_jiffy; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* dir.c */ ++extern struct file_operations aufs_dir_fop; ++int au_test_empty_lower(struct dentry *dentry); ++int test_empty(struct dentry *dentry, struct aufs_nhash *whlist); ++void au_add_nlink(struct inode *dir, struct inode *h_dir); ++void au_sub_nlink(struct inode *dir, struct inode *h_dir); ++ ++/* vdir.c */ ++struct aufs_nhash *nhash_new(gfp_t gfp); ++void nhash_del(struct aufs_nhash *nhash); ++void nhash_init(struct aufs_nhash *nhash); ++void nhash_move(struct aufs_nhash *dst, struct aufs_nhash *src); ++void nhash_fin(struct aufs_nhash *nhash); ++int is_longer_wh(struct aufs_nhash *whlist, aufs_bindex_t btgt, int limit); ++int test_known_wh(struct aufs_nhash *whlist, char *name, int namelen); ++int append_wh(struct aufs_nhash *whlist, char *name, int namelen, ++ aufs_bindex_t bindex); ++void free_vdir(struct aufs_vdir *vdir); ++int au_init_vdir(struct file *file); ++int au_fill_de(struct file *file, void *dirent, filldir_t filldir); ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline ++unsigned int au_name_hash(const unsigned char *name, unsigned int len) ++{ ++ return (full_name_hash(name, len) % AUFS_NHASH_SIZE); ++} ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_DIR_H__ */ +diff --git a/fs/aufs/export.c b/fs/aufs/export.c +new file mode 100755 +index 0000000..7b1c6ac +--- /dev/null ++++ b/fs/aufs/export.c +@@ -0,0 +1,585 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: export.c,v 1.7 2007/05/14 03:38:24 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++extern struct export_operations export_op_default; ++#define CALL(ops, func) (((ops)->func) ? ((ops)->func) : export_op_default.func) ++#define is_anon(d) ((d)->d_flags & DCACHE_DISCONNECTED) ++ ++union conv { ++#if BITS_PER_LONG == 32 ++ __u32 a[1]; ++#else ++ __u32 a[2]; ++#endif ++ ino_t ino; ++}; ++ ++static ino_t decode_ino(__u32 *a) ++{ ++ union conv u; ++ u.a[0] = a[0]; ++#if BITS_PER_LONG == 64 ++ u.a[1] = a[1]; ++#endif ++ return u.ino; ++} ++ ++static void encode_ino(__u32 *a, ino_t ino) ++{ ++ union conv u; ++ u.ino = ino; ++ a[0] = u.a[0]; ++#if BITS_PER_LONG == 64 ++ a[1] = u.a[1]; ++#endif ++} ++ ++static void decode_br_id_sigen(__u32 a, aufs_bindex_t *br_id, ++ aufs_bindex_t *sigen) ++{ ++ BUILD_BUG_ON((sizeof(*br_id) + sizeof(*sigen)) > sizeof(a)); ++ *br_id = a >> 16; ++ DEBUG_ON(*br_id < 0); ++ *sigen = a; ++ DEBUG_ON(*sigen < 0); ++} ++ ++static __u32 encode_br_id_sigen(aufs_bindex_t br_id, aufs_bindex_t sigen) ++{ ++ DEBUG_ON(br_id < 0 || sigen < 0); ++ return (br_id << 16) | sigen; ++} ++ ++/* NFS file handle */ ++enum { ++ /* support 64bit inode number */ ++ /* but untested */ ++ Fh_br_id_sigen, ++ Fh_ino1, ++#if BITS_PER_LONG == 64 ++ Fh_ino2, ++#endif ++ Fh_dir_ino1, ++#if BITS_PER_LONG == 64 ++ Fh_dir_ino2, ++#endif ++ Fh_h_ino1, ++#if BITS_PER_LONG == 64 ++ Fh_h_ino2, ++#endif ++ Fh_h_igen, ++ Fh_h_type, ++ Fh_tail, ++ ++ Fh_ino = Fh_ino1, ++ Fh_dir_ino = Fh_dir_ino1, ++ Fh_h_ino = Fh_h_ino1, ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++static struct dentry *decode_by_ino(struct super_block *sb, ino_t ino, ++ ino_t dir_ino) ++{ ++ struct dentry *dentry; ++ struct inode *inode; ++ ++ LKTRTrace("i%lu, diri%lu\n", ino, dir_ino); ++ ++ dentry = NULL; ++ inode = ilookup(sb, ino); ++ if (unlikely(!inode)) ++ goto out; ++ ++ dentry = ERR_PTR(-ESTALE); ++ if (unlikely(is_bad_inode(inode))) ++ goto out_iput; ++ ++ dentry = NULL; ++ if (!S_ISDIR(inode->i_mode)) { ++ struct dentry *d; ++ spin_lock(&dcache_lock); ++ list_for_each_entry(d, &inode->i_dentry, d_alias) ++ if (!is_anon(d) ++ && d->d_parent->d_inode->i_ino == dir_ino) { ++ dentry = dget_locked(d); ++ break; ++ } ++ spin_unlock(&dcache_lock); ++ } else { ++ dentry = d_find_alias(inode); ++ if (dentry ++ && !is_anon(dentry) ++ && dentry->d_parent->d_inode->i_ino == dir_ino) ++ goto out_iput; /* success */ ++ ++ dput(dentry); ++ dentry = NULL; ++ } ++ ++ out_iput: ++ iput(inode); ++ out: ++ TraceErrPtr(dentry); ++ return dentry; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct find_name_by_ino { ++ int called, found; ++ ino_t ino; ++ char *name; ++ int namelen; ++}; ++ ++static int ++find_name_by_ino(void *arg, const char *name, int namelen, loff_t offset, ++ filldir_ino_t ino, unsigned int d_type) ++{ ++ struct find_name_by_ino *a = arg; ++ ++ a->called++; ++ if (a->ino != ino) ++ return 0; ++ ++ memcpy(a->name, name, namelen); ++ a->namelen = namelen; ++ a->found = 1; ++ return 1; ++} ++ ++static struct dentry *decode_by_dir_ino(struct super_block *sb, ino_t ino, ++ ino_t dir_ino) ++{ ++ struct dentry *dentry, *parent; ++ struct inode *dir; ++ struct find_name_by_ino arg; ++ struct file *file; ++ int err; ++ ++ LKTRTrace("i%lu, diri%lu\n", ino, dir_ino); ++ ++ dentry = NULL; ++ dir = ilookup(sb, dir_ino); ++ if (unlikely(!dir)) ++ goto out; ++ ++ dentry = ERR_PTR(-ESTALE); ++ if (unlikely(is_bad_inode(dir))) ++ goto out_iput; ++ ++ dentry = NULL; ++ parent = d_find_alias(dir); ++ if (parent) { ++ if (unlikely(is_anon(parent))) { ++ dput(parent); ++ goto out_iput; ++ } ++ } else ++ goto out_iput; ++ ++ file = dentry_open(parent, NULL, au_dir_roflags); ++ dentry = (void*)file; ++ if (IS_ERR(file)) ++ goto out_iput; ++ ++ dentry = ERR_PTR(-ENOMEM); ++ arg.name = __getname(); ++ if (unlikely(!arg.name)) ++ goto out_fput; ++ arg.ino = ino; ++ arg.found = 0; ++ ++ do { ++ arg.called = 0; ++ //smp_mb(); ++ err = vfsub_readdir(file, find_name_by_ino, &arg, /*dlgt*/0); ++ } while (!err && !arg.found && arg.called); ++ dentry = ERR_PTR(err); ++ if (arg.found) { ++ /* do not call lkup_one(), nor dlgt */ ++ i_lock(dir); ++ dentry = lookup_one_len(arg.name, parent, arg.namelen); ++ i_unlock(dir); ++ TraceErrPtr(dentry); ++ } ++ ++ //out_putname: ++ __putname(arg.name); ++ out_fput: ++ fput(file); ++ out_iput: ++ iput(dir); ++ out: ++ TraceErrPtr(dentry); ++ return dentry; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct append_name { ++ int found, called, len; ++ char *h_path; ++ ino_t h_ino; ++}; ++ ++static int append_name(void *arg, const char *name, int len, loff_t pos, ++ filldir_ino_t ino, unsigned int d_type) ++{ ++ struct append_name *a = arg; ++ char *p; ++ ++ a->called++; ++ if (ino != a->h_ino) ++ return 0; ++ ++ DEBUG_ON(len == 1 && *name == '.'); ++ DEBUG_ON(len == 2 && name[0] == '.' && name[1] == '.'); ++ a->len = strlen(a->h_path); ++ memmove(a->h_path - a->len - 1, a->h_path, a->len); ++ a->h_path -= a->len + 1; ++ p = a->h_path + a->len; ++ *p++ = '/'; ++ memcpy(p, name, a->len); ++ a->len += 1 + len; ++ a->found++; ++ return 1; ++} ++ ++static int h_acceptable(void *expv, struct dentry *dentry) ++{ ++ return 1; ++} ++ ++static struct dentry* ++decode_by_path(struct super_block *sb, aufs_bindex_t bindex, __u32 *fh, ++ int fh_len, void *context) ++{ ++ struct dentry *dentry, *h_parent, *root, *h_root; ++ struct super_block *h_sb; ++ char *path, *p; ++ struct vfsmount *h_mnt; ++ struct append_name arg; ++ int len, err; ++ struct file *h_file; ++ struct nameidata nd; ++ struct aufs_branch *br; ++ ++ LKTRTrace("b%d\n", bindex); ++ SiMustAnyLock(sb); ++ ++ br = stobr(sb, bindex); ++ //br_get(br); ++ h_mnt = br->br_mnt; ++ h_sb = h_mnt->mnt_sb; ++ LKTRTrace("%s, h_decode_fh\n", au_sbtype(h_sb)); ++ h_parent = CALL(h_sb->s_export_op, decode_fh) ++ (h_sb, fh + Fh_tail, fh_len - Fh_tail, fh[Fh_h_type], ++ h_acceptable, /*context*/NULL); ++ dentry = h_parent; ++ if (unlikely(!h_parent || IS_ERR(h_parent))) { ++ Warn1("%s decode_fh failed\n", au_sbtype(h_sb)); ++ goto out; ++ } ++ dentry = NULL; ++ if (unlikely(is_anon(h_parent))) { ++ Warn1("%s decode_fh returned a disconnected dentry\n", ++ au_sbtype(h_sb)); ++ dput(h_parent); ++ goto out; ++ } ++ ++ dentry = ERR_PTR(-ENOMEM); ++ path = __getname(); ++ if (unlikely(!path)) { ++ dput(h_parent); ++ goto out; ++ } ++ ++ root = sb->s_root; ++ di_read_lock_parent(root, !AUFS_I_RLOCK); ++ h_root = au_h_dptr_i(root, bindex); ++ di_read_unlock(root, !AUFS_I_RLOCK); ++ arg.h_path = d_path(h_root, h_mnt, path, PATH_MAX); ++ dentry = (void*)arg.h_path; ++ if (unlikely(!arg.h_path || IS_ERR(arg.h_path))) ++ goto out_putname; ++ len = strlen(arg.h_path); ++ arg.h_path = d_path(h_parent, h_mnt, path, PATH_MAX); ++ dentry = (void*)arg.h_path; ++ if (unlikely(!arg.h_path || IS_ERR(arg.h_path))) ++ goto out_putname; ++ LKTRTrace("%s\n", arg.h_path); ++ if (len != 1) ++ arg.h_path += len; ++ LKTRTrace("%s\n", arg.h_path); ++ ++ /* cf. fs/exportfs/expfs.c */ ++ h_file = dentry_open(h_parent, NULL, au_dir_roflags); ++ dentry = (void*)h_file; ++ if (IS_ERR(h_file)) ++ goto out_putname; ++ ++ arg.found = 0; ++ arg.h_ino = decode_ino(fh + Fh_h_ino); ++ do { ++ arg.called = 0; ++ err = vfsub_readdir(h_file, append_name, &arg, /*dlgt*/0); ++ } while (!err && !arg.found && arg.called); ++ LKTRTrace("%s, %d\n", arg.h_path, arg.len); ++ ++ p = d_path(root, stosi(sb)->si_mnt, path, PATH_MAX - arg.len - 2); ++ dentry = (void*)p; ++ if (unlikely(!p || IS_ERR(p))) ++ goto out_fput; ++ p[strlen(p)] = '/'; ++ LKTRTrace("%s\n", p); ++ ++ err = path_lookup(p, LOOKUP_FOLLOW, &nd); ++ dentry = ERR_PTR(err); ++ if (!err) { ++ dentry = dget(nd.dentry); ++ if (unlikely(is_anon(dentry))) { ++ dput(dentry); ++ dentry = ERR_PTR(-ESTALE); ++ } ++ path_release(&nd); ++ } ++ ++ out_fput: ++ fput(h_file); ++ out_putname: ++ __putname(path); ++ out: ++ //br_put(br); ++ TraceErrPtr(dentry); ++ return dentry; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static struct dentry* ++aufs_decode_fh(struct super_block *sb, __u32 *fh, int fh_len, int fh_type, ++ int (*acceptable)(void *context, struct dentry *de), ++ void *context) ++{ ++ struct dentry *dentry; ++ ino_t ino, dir_ino; ++ aufs_bindex_t bindex, br_id, sigen_v; ++ struct inode *inode, *h_inode; ++ ++ //au_debug_on(); ++ LKTRTrace("%d, fh{i%u, br_id_sigen 0x%x, hi%u}\n", ++ fh_type, fh[Fh_ino], fh[Fh_br_id_sigen], fh[Fh_h_ino]); ++ DEBUG_ON(fh_len < Fh_tail); ++ ++ si_read_lock(sb); ++ lockdep_off(); ++ ++ /* branch id may be wrapped around */ ++ dentry = ERR_PTR(-ESTALE); ++ decode_br_id_sigen(fh[Fh_br_id_sigen], &br_id, &sigen_v); ++ bindex = find_brindex(sb, br_id); ++ if (unlikely(bindex < 0 || au_sigen(sb) < sigen_v)) ++ goto out; ++ ++ /* is this inode still cached? */ ++ ino = decode_ino(fh + Fh_ino); ++ dir_ino = decode_ino(fh + Fh_dir_ino); ++ dentry = decode_by_ino(sb, ino, dir_ino); ++ if (IS_ERR(dentry)) ++ goto out; ++ if (dentry) ++ goto accept; ++ ++ /* is the parent dir cached? */ ++ dentry = decode_by_dir_ino(sb, ino, dir_ino); ++ if (IS_ERR(dentry)) ++ goto out; ++ if (dentry) ++ goto accept; ++ ++ /* lookup path */ ++ dentry = decode_by_path(sb, bindex, fh, fh_len, context); ++ if (IS_ERR(dentry)) ++ goto out; ++ if (unlikely(!dentry)) ++ goto out_stale; ++ if (unlikely(dentry->d_inode->i_ino != ino)) ++ goto out_dput; ++ ++ accept: ++ inode = dentry->d_inode; ++ h_inode = NULL; ++ ii_read_lock_child(inode); ++ if (ibstart(inode) <= bindex && bindex <= ibend(inode)) ++ h_inode = au_h_iptr_i(inode, bindex); ++ ii_read_unlock(inode); ++ if (h_inode ++ && h_inode->i_generation == fh[Fh_h_igen] ++ && acceptable(context, dentry)) ++ goto out; /* success */ ++ out_dput: ++ dput(dentry); ++ out_stale: ++ dentry = ERR_PTR(-ESTALE); ++ out: ++ lockdep_on(); ++ si_read_unlock(sb); ++ TraceErrPtr(dentry); ++ //au_debug_off(); ++ return dentry; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int aufs_encode_fh(struct dentry *dentry, __u32 *fh, int *max_len, ++ int connectable) ++{ ++ int err; ++ struct super_block *sb, *h_sb; ++ struct inode *inode, *h_inode, *dir; ++ aufs_bindex_t bindex; ++ union conv u; ++ struct dentry *parent, *h_parent; ++ ++ //au_debug_on(); ++ BUILD_BUG_ON(sizeof(u.ino) != sizeof(u.a)); ++ LKTRTrace("%.*s, max %d, conn %d\n", ++ DLNPair(dentry), *max_len, connectable); ++ DEBUG_ON(is_anon(dentry)); ++ inode = dentry->d_inode; ++ DEBUG_ON(!inode); ++ parent = dentry->d_parent; ++ DEBUG_ON(is_anon(parent)); ++ ++ err = -ENOSPC; ++ if (unlikely(*max_len <= Fh_tail)) { ++ Warn1("NFSv2 client (max_len %d)?\n", *max_len); ++ goto out; ++ } ++ ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ di_read_lock_child(dentry, AUFS_I_RLOCK); ++ di_read_lock_parent(parent, AUFS_I_RLOCK); ++#ifdef CONFIG_AUFS_DEBUG ++ if (unlikely(!au_flag_test(sb, AuFlag_XINO))) ++ Warn1("NFS-exporting requires xino\n"); ++#if 0 ++ if (unlikely(au_flag_test(sb, AuFlag_UDBA_INOTIFY))) ++ Warn1("udba=inotify is not recommended when exporting\n"); ++#endif ++#endif ++ ++ err = -EPERM; ++ bindex = ibstart(inode); ++ h_sb = sbr_sb(sb, bindex); ++ if (unlikely(!h_sb->s_export_op)) { ++ Err1("%s branch is not exportable\n", au_sbtype(h_sb)); ++ goto out_unlock; ++ } ++ ++#if 0 //def CONFIG_AUFS_ROBR ++ if (unlikely(SB_AUFS(h_sb))) { ++ Err1("aufs branch is not supported\n"); ++ goto out_unlock; ++ } ++#endif ++ ++ /* doesn't support pseudo-link */ ++ if (unlikely(bindex < dbstart(dentry) ++ || dbend(dentry) < bindex ++ || !au_h_dptr_i(dentry, bindex))) { ++ Err("%.*s/%.*s, b%d, pseudo-link?\n", ++ DLNPair(dentry->d_parent), DLNPair(dentry), bindex); ++ goto out_unlock; ++ } ++ ++ fh[Fh_br_id_sigen] = encode_br_id_sigen(sbr_id(sb, bindex), ++ au_sigen(sb)); ++ encode_ino(fh + Fh_ino, inode->i_ino); ++ dir = parent->d_inode; ++ encode_ino(fh + Fh_dir_ino, dir->i_ino); ++ h_inode = au_h_iptr(inode); ++ encode_ino(fh + Fh_h_ino, h_inode->i_ino); ++ fh[Fh_h_igen] = h_inode->i_generation; ++ ++ /* it should be set at exporting time */ ++ if (unlikely(!h_sb->s_export_op->find_exported_dentry)) { ++ Warn("set default find_exported_dentry for %s\n", ++ au_sbtype(h_sb)); ++ h_sb->s_export_op->find_exported_dentry = find_exported_dentry; ++ } ++ ++ *max_len -= Fh_tail; ++ //LKTRTrace("Fh_tail %d, max_len %d\n", Fh_tail, *max_len); ++ h_parent = au_h_dptr_i(parent, bindex); ++ DEBUG_ON(is_anon(h_parent)); ++ err = fh[Fh_h_type] = CALL(h_sb->s_export_op, encode_fh) ++ (h_parent, fh + Fh_tail, max_len, connectable); ++ *max_len += Fh_tail; ++ if (err != 255) ++ err = 2; //?? ++ else ++ Warn1("%s encode_fh failed\n", au_sbtype(h_sb)); ++ ++ out_unlock: ++ di_read_unlock(parent, AUFS_I_RLOCK); ++ aufs_read_unlock(dentry, AUFS_I_RLOCK); ++ out: ++ TraceErr(err); ++ //au_debug_off(); ++ if (unlikely(err < 0)) ++ err = 255; ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#if 0 ++struct export_operations { ++ struct dentry *(*decode_fh)(struct super_block *sb, __u32 *fh, int fh_len, int fh_type, ++ int (*acceptable)(void *context, struct dentry *de), ++ void *context); ++ int (*encode_fh)(struct dentry *de, __u32 *fh, int *max_len, ++ int connectable); ++ ++ /* the following are only called from the filesystem itself */ ++ int (*get_name)(struct dentry *parent, char *name, ++ struct dentry *child); ++ struct dentry * (*get_parent)(struct dentry *child); ++ struct dentry * (*get_dentry)(struct super_block *sb, void *inump); ++ ++ /* This is set by the exporting module to a standard helper */ ++ struct dentry * (*find_exported_dentry)( ++ struct super_block *sb, void *obj, void *parent, ++ int (*acceptable)(void *context, struct dentry *de), ++ void *context); ++}; ++#endif ++ ++struct export_operations aufs_export_op = { ++ .decode_fh = aufs_decode_fh, ++ .encode_fh = aufs_encode_fh ++}; +diff --git a/fs/aufs/f_op.c b/fs/aufs/f_op.c +new file mode 100755 +index 0000000..3cd1081 +--- /dev/null ++++ b/fs/aufs/f_op.c +@@ -0,0 +1,684 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: f_op.c,v 1.27 2007/05/14 03:38:24 sfjro Exp $ */ ++ ++#include <linux/fsnotify.h> ++#include <linux/pagemap.h> ++#include <linux/poll.h> ++#include <linux/security.h> ++#include <linux/version.h> ++#include "aufs.h" ++ ++/* common function to regular file and dir */ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++#define FlushArgs hidden_file, id ++int aufs_flush(struct file *file, fl_owner_t id) ++#else ++#define FlushArgs hidden_file ++int aufs_flush(struct file *file) ++#endif ++{ ++ int err; ++ struct dentry *dentry; ++ aufs_bindex_t bindex, bend; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ ++ // aufs_read_lock_file() ++ si_read_lock(dentry->d_sb); ++ fi_read_lock(file); ++ di_read_lock_child(dentry, !AUFS_I_RLOCK); ++ ++ err = 0; ++ bend = fbend(file); ++ for (bindex = fbstart(file); !err && bindex <= bend; bindex++) { ++ struct file *hidden_file; ++ hidden_file = au_h_fptr_i(file, bindex); ++ if (hidden_file && hidden_file->f_op ++ && hidden_file->f_op->flush) ++ err = hidden_file->f_op->flush(FlushArgs); ++ } ++ ++ di_read_unlock(dentry, !AUFS_I_RLOCK); ++ fi_read_unlock(file); ++ si_read_unlock(dentry->d_sb); ++ TraceErr(err); ++ return err; ++} ++#undef FlushArgs ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int do_open_nondir(struct file *file, int flags) ++{ ++ int err; ++ aufs_bindex_t bindex; ++ struct super_block *sb; ++ struct file *hidden_file; ++ struct dentry *dentry; ++ struct inode *inode; ++ struct aufs_finfo *finfo; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, flags 0%o\n", DLNPair(dentry), flags); ++ FiMustWriteLock(file); ++ inode = dentry->d_inode; ++ DEBUG_ON(!inode || S_ISDIR(inode->i_mode)); ++ ++ err = 0; ++ finfo = ftofi(file); ++ finfo->fi_h_vm_ops = NULL; ++ sb = dentry->d_sb; ++ bindex = dbstart(dentry); ++ DEBUG_ON(!au_h_dptr(dentry)->d_inode); ++ /* O_TRUNC is processed already */ ++ BUG_ON(test_ro(sb, bindex, inode) && (flags & O_TRUNC)); ++ ++ hidden_file = hidden_open(dentry, bindex, flags); ++ //if (LktrCond) {fput(hidden_file); br_put(stobr(dentry->d_sb, bindex)); ++ //hidden_file = ERR_PTR(-1);} ++ if (!IS_ERR(hidden_file)) { ++ set_fbstart(file, bindex); ++ set_fbend(file, bindex); ++ set_h_fptr(file, bindex, hidden_file); ++ return 0; /* success */ ++ } ++ err = PTR_ERR(hidden_file); ++ TraceErr(err); ++ return err; ++} ++ ++static int aufs_open_nondir(struct inode *inode, struct file *file) ++{ ++ return au_do_open(inode, file, do_open_nondir); ++} ++ ++static int aufs_release_nondir(struct inode *inode, struct file *file) ++{ ++ struct super_block *sb = file->f_dentry->d_sb; ++ ++ LKTRTrace("i%lu, %.*s\n", inode->i_ino, DLNPair(file->f_dentry)); ++ ++ si_read_lock(sb); ++ au_fin_finfo(file); ++ si_read_unlock(sb); ++ return 0; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static ssize_t aufs_read(struct file *file, char __user *buf, size_t count, ++ loff_t *ppos) ++{ ++ ssize_t err; ++ struct dentry *dentry; ++ struct file *hidden_file; ++ struct super_block *sb; ++ struct inode *h_inode; ++ int dlgt; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, cnt %lu, pos %Ld\n", ++ DLNPair(dentry), (unsigned long)count, *ppos); ++ ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = au_reval_and_lock_finfo(file, au_reopen_nondir, /*wlock*/0, ++ /*locked*/0); ++ //if (LktrCond) {fi_read_unlock(file); err = -1;} ++ if (unlikely(err)) ++ goto out; ++ ++ /* support LSM and notify */ ++ dlgt = need_dlgt(sb); ++ hidden_file = au_h_fptr(file); ++ h_inode = hidden_file->f_dentry->d_inode; ++ if (!au_flag_test(sb, AuFlag_UDBA_INOTIFY)) ++ err = vfsub_read_u(hidden_file, buf, count, ppos, dlgt); ++ else { ++ struct inode *dir = dentry->d_parent->d_inode, ++ *h_dir = hidden_file->f_dentry->d_parent->d_inode; ++ aufs_bindex_t bstart = fbstart(file); ++ hdir_lock(h_dir, dir, bstart); ++ err = vfsub_read_u(hidden_file, buf, count, ppos, dlgt); ++ hdir_unlock(h_dir, dir, bstart); ++ } ++ memcpy(&file->f_ra, &hidden_file->f_ra, sizeof(file->f_ra)); //?? ++ dentry->d_inode->i_atime = hidden_file->f_dentry->d_inode->i_atime; ++ ++ fi_read_unlock(file); ++ out: ++ si_read_unlock(sb); ++ TraceErr(err); ++ return err; ++} ++ ++static ssize_t aufs_write(struct file *file, const char __user *__buf, ++ size_t count, loff_t *ppos) ++{ ++ ssize_t err; ++ struct dentry *dentry; ++ struct inode *inode; ++ struct super_block *sb; ++ struct file *hidden_file; ++ char __user *buf = (char __user*)__buf; ++ struct inode *h_inode; ++ int dlgt; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, cnt %lu, pos %Ld\n", ++ DLNPair(dentry), (unsigned long)count, *ppos); ++ ++ inode = dentry->d_inode; ++ i_lock(inode); ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = au_reval_and_lock_finfo(file, au_reopen_nondir, /*wlock*/1, ++ /*locked*/1); ++ //if (LktrCond) {fi_write_unlock(file); err = -1;} ++ if (unlikely(err)) ++ goto out; ++ err = au_ready_to_write(file, -1); ++ //if (LktrCond) err = -1; ++ if (unlikely(err)) ++ goto out_unlock; ++ ++ /* support LSM and notify */ ++ dlgt = need_dlgt(sb); ++ hidden_file = au_h_fptr(file); ++ h_inode = hidden_file->f_dentry->d_inode; ++ if (!au_flag_test(sb, AuFlag_UDBA_INOTIFY)) ++ err = vfsub_write_u(hidden_file, buf, count, ppos, dlgt); ++ else { ++ struct inode *dir = dentry->d_parent->d_inode, ++ *h_dir = hidden_file->f_dentry->d_parent->d_inode; ++ aufs_bindex_t bstart = fbstart(file); ++ hdir_lock(h_dir, dir, bstart); ++ err = vfsub_write_u(hidden_file, buf, count, ppos, dlgt); ++ hdir_unlock(h_dir, dir, bstart); ++ } ++ ii_write_lock_child(inode); ++ au_cpup_attr_timesizes(inode); ++ ii_write_unlock(inode); ++ ++ out_unlock: ++ fi_write_unlock(file); ++ out: ++ si_read_unlock(sb); ++ i_unlock(inode); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#if 0 //def CONFIG_AUFS_ROBR ++struct lvma { ++ struct list_head list; ++ struct vm_area_struct *vma; ++}; ++ ++static struct file *safe_file(struct vm_area_struct *vma) ++{ ++ struct file *file = vma->vm_file; ++ struct super_block *sb = file->f_dentry->d_sb; ++ struct lvma *lvma, *entry; ++ struct aufs_sbinfo *sbinfo; ++ int found, warn; ++ ++ TraceEnter(); ++ DEBUG_ON(!SB_AUFS(sb)); ++ ++ warn = 0; ++ found = 0; ++ sbinfo = stosi(sb); ++ spin_lock(&sbinfo->si_lvma_lock); ++ list_for_each_entry(entry, &sbinfo->si_lvma, list) { ++ found = (entry->vma == vma); ++ if (unlikely(found)) ++ break; ++ } ++ if (!found) { ++ lvma = kmalloc(sizeof(*lvma), GFP_ATOMIC); ++ if (lvma) { ++ lvma->vma = vma; ++ list_add(&lvma->list, &sbinfo->si_lvma); ++ } else { ++ warn = 1; ++ file = NULL; ++ } ++ } else ++ file = NULL; ++ spin_unlock(&sbinfo->si_lvma_lock); ++ ++ if (unlikely(warn)) ++ Warn1("no memory for lvma\n"); ++ return file; ++} ++ ++static void reset_file(struct vm_area_struct *vma, struct file *file) ++{ ++ struct super_block *sb = file->f_dentry->d_sb; ++ struct lvma *entry, *found; ++ struct aufs_sbinfo *sbinfo; ++ ++ TraceEnter(); ++ DEBUG_ON(!SB_AUFS(sb)); ++ ++ vma->vm_file = file; ++ ++ found = NULL; ++ sbinfo = stosi(sb); ++ spin_lock(&sbinfo->si_lvma_lock); ++ list_for_each_entry(entry, &sbinfo->si_lvma, list) ++ if (entry->vma == vma){ ++ found = entry; ++ break; ++ } ++ DEBUG_ON(!found); ++ list_del(&found->list); ++ spin_unlock(&sbinfo->si_lvma_lock); ++ kfree(found); ++} ++ ++#else ++ ++static struct file *safe_file(struct vm_area_struct *vma) ++{ ++ struct file *file; ++ ++ file = vma->vm_file; ++ if (file->private_data && au_is_aufs(file->f_dentry->d_sb)) ++ return file; ++ return NULL; ++} ++ ++static void reset_file(struct vm_area_struct *vma, struct file *file) ++{ ++ vma->vm_file = file; ++ smp_mb(); ++} ++#endif /* CONFIG_AUFS_ROBR */ ++ ++static struct page *aufs_nopage(struct vm_area_struct *vma, unsigned long addr, ++ int *type) ++{ ++ struct page *page; ++ struct dentry *dentry; ++ struct file *file, *hidden_file; ++ struct inode *inode; ++ static DECLARE_WAIT_QUEUE_HEAD(wq); ++ struct aufs_finfo *finfo; ++ ++ TraceEnter(); ++ DEBUG_ON(!vma || !vma->vm_file); ++ wait_event(wq, (file = safe_file(vma))); ++ DEBUG_ON(!au_is_aufs(file->f_dentry->d_sb)); ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, addr %lx\n", DLNPair(dentry), addr); ++ inode = dentry->d_inode; ++ DEBUG_ON(!S_ISREG(inode->i_mode)); ++ ++ // do not revalidate, nor lock ++ finfo = ftofi(file); ++ hidden_file = finfo->fi_hfile[0 + finfo->fi_bstart].hf_file; ++ DEBUG_ON(!hidden_file || !au_is_mmapped(file)); ++ vma->vm_file = hidden_file; ++ //smp_mb(); ++ page = finfo->fi_h_vm_ops->nopage(vma, addr, type); ++ reset_file(vma, file); ++#if 0 //def CONFIG_SMP ++ //wake_up_nr(&wq, online_cpu - 1); ++ wake_up_all(&wq); ++#else ++ wake_up(&wq); ++#endif ++ if (!IS_ERR(page)) { ++ //page->mapping = file->f_mapping; ++ //get_page(page); ++ //file->f_mapping = hidden_file->f_mapping; ++ //touch_atime(NULL, dentry); ++ //inode->i_atime = hidden_file->f_dentry->d_inode->i_atime; ++ } ++ TraceErrPtr(page); ++ return page; ++} ++ ++static int aufs_populate(struct vm_area_struct *vma, unsigned long addr, ++ unsigned long len, pgprot_t prot, unsigned long pgoff, ++ int nonblock) ++{ ++ Err("please report me this application\n"); ++ BUG(); ++ return ftofi(vma->vm_file)->fi_h_vm_ops->populate ++ (vma, addr, len, prot, pgoff, nonblock); ++} ++ ++static struct vm_operations_struct aufs_vm_ops = { ++ //.open = aufs_vmaopen, ++ //.close = aufs_vmaclose, ++ .nopage = aufs_nopage, ++ .populate = aufs_populate, ++ //page_mkwrite(struct vm_area_struct *vma, struct page *page) ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int aufs_mmap(struct file *file, struct vm_area_struct *vma) ++{ ++ int err, wlock, mmapped; ++ struct dentry *dentry; ++ struct super_block *sb; ++ struct file *h_file; ++ struct vm_operations_struct *vm_ops; ++ unsigned long flags; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, %lx, len %lu\n", ++ DLNPair(dentry), vma->vm_start, vma->vm_end - vma->vm_start); ++ DEBUG_ON(!S_ISREG(dentry->d_inode->i_mode)); ++ DEBUG_ON(down_write_trylock(&vma->vm_mm->mmap_sem)); ++ ++ mmapped = au_is_mmapped(file); ++ wlock = 0; ++ if (file->f_mode & FMODE_WRITE) { ++ flags = VM_SHARED | VM_WRITE; ++ wlock = ((flags & vma->vm_flags) == flags); ++ } ++ ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = au_reval_and_lock_finfo(file, au_reopen_nondir, ++ wlock | !mmapped, /*locked*/0); ++ //err = -1; ++ if (unlikely(err)) ++ goto out; ++ ++ if (wlock) { ++ err = au_ready_to_write(file, -1); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_unlock; ++ } ++ ++ h_file = au_h_fptr(file); ++ vm_ops = ftofi(file)->fi_h_vm_ops; ++ if (unlikely(!mmapped)) { ++ // nfs uses some locks ++ lockdep_off(); ++ err = h_file->f_op->mmap(h_file, vma); ++ lockdep_on(); ++ if (unlikely(err)) ++ goto out_unlock; ++ vm_ops = vma->vm_ops; ++ DEBUG_ON(!vm_ops); ++ err = do_munmap(current->mm, vma->vm_start, ++ vma->vm_end - vma->vm_start); ++ if (unlikely(err)) { ++ IOErr("failed internal unmapping %.*s, %d\n", ++ DLNPair(h_file->f_dentry), err); ++ err = -EIO; ++ goto out_unlock; ++ } ++ } ++ DEBUG_ON(!vm_ops); ++ ++ err = generic_file_mmap(file, vma); ++ if (!err) { ++ file_accessed(h_file); ++ dentry->d_inode->i_atime = h_file->f_dentry->d_inode->i_atime; ++ vma->vm_ops = &aufs_vm_ops; ++ if (unlikely(!mmapped)) ++ ftofi(file)->fi_h_vm_ops = vm_ops; ++ } ++ ++ out_unlock: ++ if (!wlock && mmapped) ++ fi_read_unlock(file); ++ else ++ fi_write_unlock(file); ++ out: ++ si_read_unlock(sb); ++ TraceErr(err); ++ return err; ++} ++ ++// todo: try do_sendfile() in fs/read_write.c ++static ssize_t aufs_sendfile(struct file *file, loff_t *ppos, ++ size_t count, read_actor_t actor, void *target) ++{ ++ ssize_t err; ++ struct file *h_file; ++ const char c = current->comm[4]; ++ /* true if a kernel thread named 'loop[0-9].*' accesses a file */ ++ const int loopback = (current->mm == NULL ++ && '0' <= c && c <= '9' ++ && strncmp(current->comm, "loop", 4) == 0); ++ struct dentry *dentry; ++ struct super_block *sb; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, pos %Ld, cnt %lu, loopback %d\n", ++ DLNPair(dentry), *ppos, (unsigned long)count, loopback); ++ ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = au_reval_and_lock_finfo(file, au_reopen_nondir, /*wlock*/0, ++ /*locked*/0); ++ if (unlikely(err)) ++ goto out; ++ ++ err = -EINVAL; ++ h_file = au_h_fptr(file); ++ if (h_file->f_op && h_file->f_op->sendfile) { ++ if (/* unlikely */(loopback)) { ++ file->f_mapping = h_file->f_mapping; ++ smp_mb(); //?? ++ } ++ // nfs uses some locks ++ lockdep_off(); ++ err = h_file->f_op->sendfile ++ (h_file, ppos, count, actor, target); ++ lockdep_on(); ++ dentry->d_inode->i_atime = h_file->f_dentry->d_inode->i_atime; ++ } ++ fi_read_unlock(file); ++ ++ out: ++ si_read_unlock(sb); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* copied from linux/fs/select.h, must match */ ++#define DEFAULT_POLLMASK (POLLIN | POLLOUT | POLLRDNORM | POLLWRNORM) ++ ++static unsigned int aufs_poll(struct file *file, poll_table *wait) ++{ ++ unsigned int mask; ++ struct file *hidden_file; ++ int err; ++ struct dentry *dentry; ++ struct super_block *sb; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, wait %p\n", DLNPair(dentry), wait); ++ DEBUG_ON(S_ISDIR(dentry->d_inode->i_mode)); ++ ++ /* We should pretend an error happend. */ ++ mask = POLLERR /* | POLLIN | POLLOUT */; ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = au_reval_and_lock_finfo(file, au_reopen_nondir, /*wlock*/0, ++ /*locked*/0); ++ //err = -1; ++ if (unlikely(err)) ++ goto out; ++ ++ /* it is not an error of hidden_file has no operation */ ++ mask = DEFAULT_POLLMASK; ++ hidden_file = au_h_fptr(file); ++ if (hidden_file->f_op && hidden_file->f_op->poll) ++ mask = hidden_file->f_op->poll(hidden_file, wait); ++ fi_read_unlock(file); ++ ++ out: ++ si_read_unlock(sb); ++ TraceErr((int)mask); ++ return mask; ++} ++ ++static int aufs_fsync_nondir(struct file *file, struct dentry *dentry, ++ int datasync) ++{ ++ int err, my_lock; ++ struct inode *inode; ++ struct file *hidden_file; ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s, %d\n", DLNPair(dentry), datasync); ++ inode = dentry->d_inode; ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,17) ++ IMustLock(inode); ++ my_lock = 0; ++#else ++ /* before 2.6.17, ++ * msync(2) calls me without locking i_sem/i_mutex, but fsync(2). ++ */ ++ my_lock = !i_trylock(inode); ++#endif ++ ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = 0; //-EBADF; // posix? ++ if (unlikely(!(file->f_mode & FMODE_WRITE))) ++ goto out; ++ err = au_reval_and_lock_finfo(file, au_reopen_nondir, /*wlock*/1, ++ /*locked*/1); ++ //err = -1; ++ if (unlikely(err)) ++ goto out; ++ err = au_ready_to_write(file, -1); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_unlock; ++ ++ err = -EINVAL; ++ hidden_file = au_h_fptr(file); ++ if (hidden_file->f_op && hidden_file->f_op->fsync) { ++ // todo: apparmor thread? ++ //file->f_mapping->host->i_mutex ++ ii_write_lock_child(inode); ++ hi_lock_child(hidden_file->f_dentry->d_inode); ++ err = hidden_file->f_op->fsync ++ (hidden_file, hidden_file->f_dentry, datasync); ++ //err = -1; ++ au_cpup_attr_timesizes(inode); ++ i_unlock(hidden_file->f_dentry->d_inode); ++ ii_write_unlock(inode); ++ } ++ ++ out_unlock: ++ fi_write_unlock(file); ++ out: ++ if (unlikely(my_lock)) ++ i_unlock(inode); ++ si_read_unlock(sb); ++ TraceErr(err); ++ return err; ++} ++ ++static int aufs_fasync(int fd, struct file *file, int flag) ++{ ++ int err; ++ struct file *hidden_file; ++ struct dentry *dentry; ++ struct super_block *sb; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, %d\n", DLNPair(dentry), flag); ++ ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ err = au_reval_and_lock_finfo(file, au_reopen_nondir, /*wlock*/0, ++ /*locked*/0); ++ //err = -1; ++ if (unlikely(err)) ++ goto out; ++ ++ hidden_file = au_h_fptr(file); ++ if (hidden_file->f_op && hidden_file->f_op->fasync) ++ err = hidden_file->f_op->fasync(fd, hidden_file, flag); ++ fi_read_unlock(file); ++ ++ out: ++ si_read_unlock(sb); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#if 0 // comment ++struct file_operations { ++ struct module *owner; ++ loff_t (*llseek) (struct file *, loff_t, int); ++ ssize_t (*read) (struct file *, char __user *, size_t, loff_t *); ++ ssize_t (*aio_read) (struct kiocb *, char __user *, size_t, loff_t); ++ ssize_t (*write) (struct file *, const char __user *, size_t, loff_t *); ++ ssize_t (*aio_write) (struct kiocb *, const char __user *, size_t, loff_t); ++ int (*readdir) (struct file *, void *, filldir_t); ++ unsigned int (*poll) (struct file *, struct poll_table_struct *); ++ int (*ioctl) (struct inode *, struct file *, unsigned int, unsigned long); ++ long (*unlocked_ioctl) (struct file *, unsigned int, unsigned long); ++ long (*compat_ioctl) (struct file *, unsigned int, unsigned long); ++ int (*mmap) (struct file *, struct vm_area_struct *); ++ int (*open) (struct inode *, struct file *); ++ int (*flush) (struct file *); ++ int (*release) (struct inode *, struct file *); ++ int (*fsync) (struct file *, struct dentry *, int datasync); ++ int (*aio_fsync) (struct kiocb *, int datasync); ++ int (*fasync) (int, struct file *, int); ++ int (*lock) (struct file *, int, struct file_lock *); ++ ssize_t (*readv) (struct file *, const struct iovec *, unsigned long, loff_t *); ++ ssize_t (*writev) (struct file *, const struct iovec *, unsigned long, loff_t *); ++ ssize_t (*sendfile) (struct file *, loff_t *, size_t, read_actor_t, void *); ++ ssize_t (*sendpage) (struct file *, struct page *, int, size_t, loff_t *, int); ++ unsigned long (*get_unmapped_area)(struct file *, unsigned long, unsigned long, unsigned long, unsigned long); ++ int (*check_flags)(int); ++ int (*dir_notify)(struct file *file, unsigned long arg); ++ int (*flock) (struct file *, int, struct file_lock *); ++}; ++#endif ++ ++struct file_operations aufs_file_fop = { ++ .read = aufs_read, ++ .write = aufs_write, ++ .poll = aufs_poll, ++ .mmap = aufs_mmap, ++ .open = aufs_open_nondir, ++ .flush = aufs_flush, ++ .release = aufs_release_nondir, ++ .fsync = aufs_fsync_nondir, ++ .fasync = aufs_fasync, ++ .sendfile = aufs_sendfile, ++}; +diff --git a/fs/aufs/file.c b/fs/aufs/file.c +new file mode 100755 +index 0000000..857a4e8 +--- /dev/null ++++ b/fs/aufs/file.c +@@ -0,0 +1,832 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: file.c,v 1.42 2007/05/14 03:39:09 sfjro Exp $ */ ++ ++//#include <linux/fsnotify.h> ++#include <linux/pagemap.h> ++//#include <linux/poll.h> ++//#include <linux/security.h> ++#include "aufs.h" ++ ++/* drop flags for writing */ ++unsigned int au_file_roflags(unsigned int flags) ++{ ++ flags &= ~(O_WRONLY | O_RDWR | O_APPEND | O_CREAT | O_TRUNC); ++ flags |= O_RDONLY | O_NOATIME; ++ return flags; ++} ++ ++/* common functions to regular file and dir */ ++struct file *hidden_open(struct dentry *dentry, aufs_bindex_t bindex, int flags) ++{ ++ struct dentry *hidden_dentry; ++ struct inode *hidden_inode; ++ struct super_block *sb; ++ struct vfsmount *hidden_mnt; ++ struct file *hidden_file; ++ struct aufs_branch *br; ++ loff_t old_size; ++ int udba; ++ ++ LKTRTrace("%.*s, b%d, flags 0%o\n", DLNPair(dentry), bindex, flags); ++ DEBUG_ON(!dentry); ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ DEBUG_ON(!hidden_dentry); ++ hidden_inode = hidden_dentry->d_inode; ++ DEBUG_ON(!hidden_inode); ++ ++ sb = dentry->d_sb; ++ udba = au_flag_test(sb, AuFlag_UDBA_INOTIFY); ++ if (unlikely(udba)) { ++ // test here? ++ } ++ ++ br = stobr(sb, bindex); ++ br_get(br); ++ /* drop flags for writing */ ++ if (test_ro(sb, bindex, dentry->d_inode)) ++ flags = au_file_roflags(flags); ++ flags &= ~O_CREAT; ++ spin_lock(&hidden_inode->i_lock); ++ old_size = i_size_read(hidden_inode); ++ spin_unlock(&hidden_inode->i_lock); ++ ++ //DbgSleep(3); ++ ++ dget(hidden_dentry); ++ hidden_mnt = mntget(br->br_mnt); ++ hidden_file = dentry_open(hidden_dentry, hidden_mnt, flags); ++ //if (LktrCond) {fput(hidden_file); hidden_file = ERR_PTR(-1);} ++ ++ if (!IS_ERR(hidden_file)) { ++#if 0 // remove this ++ if (/* old_size && */ (flags & O_TRUNC)) { ++ au_direval_dec(dentry); ++ if (!IS_ROOT(dentry)) ++ au_direval_dec(dentry->d_parent); ++ } ++#endif ++ return hidden_file; ++ } ++ ++ br_put(br); ++ TraceErrPtr(hidden_file); ++ return hidden_file; ++} ++ ++static int do_coo(struct dentry *dentry, aufs_bindex_t bstart) ++{ ++ int err; ++ struct dentry *parent, *h_parent, *h_dentry; ++ aufs_bindex_t bcpup; ++ struct inode *h_dir, *h_inode, *dir; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ DEBUG_ON(IS_ROOT(dentry)); ++ DiMustWriteLock(dentry); ++ ++ parent = dentry->d_parent; // dget_parent() ++ di_write_lock_parent(parent); ++ bcpup = err = find_rw_parent_br(dentry, bstart); ++ //bcpup = err = find_rw_br(sb, bstart); ++ if (unlikely(err < 0)) { ++ err = 0; // stop copyup, it is not an error ++ goto out; ++ } ++ err = 0; ++ ++ h_parent = au_h_dptr_i(parent, bcpup); ++ if (!h_parent) { ++ err = cpup_dirs(dentry, bcpup, NULL); ++ if (unlikely(err)) ++ goto out; ++ h_parent = au_h_dptr_i(parent, bcpup); ++ } ++ ++ h_dir = h_parent->d_inode; ++ h_dentry = au_h_dptr_i(dentry, bstart); ++ h_inode = h_dentry->d_inode; ++ dir = parent->d_inode; ++ hdir_lock(h_dir, dir, bcpup); ++ hi_lock_child(h_inode); ++ DEBUG_ON(au_h_dptr_i(dentry, bcpup)); ++ err = sio_cpup_simple(dentry, bcpup, -1, ++ au_flags_cpup(CPUP_DTIME, parent)); ++ TraceErr(err); ++ i_unlock(h_inode); ++ hdir_unlock(h_dir, dir, bcpup); ++ ++ out: ++ di_write_unlock(parent); ++ TraceErr(err); ++ return err; ++} ++ ++int au_do_open(struct inode *inode, struct file *file, ++ int (*open)(struct file *file, int flags)) ++{ ++ int err, coo; ++ struct dentry *dentry; ++ struct super_block *sb; ++ aufs_bindex_t bstart; ++ struct inode *h_dir, *dir; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("i%lu, %.*s\n", inode->i_ino, DLNPair(dentry)); ++ ++ sb = dentry->d_sb; ++ si_read_lock(sb); ++ coo = 0; ++#if 0 ++ switch (au_flag_test_coo(sb)) { ++ case AuFlag_COO_LEAF: ++ coo = !S_ISDIR(inode->i_mode); ++ break; ++ case AuFlag_COO_ALL: ++ coo = 1; ++ break; ++ } ++#endif ++ err = au_init_finfo(file); ++ //if (LktrCond) {fi_write_unlock(file); fin_finfo(file); err = -1;} ++ if (unlikely(err)) ++ goto out; ++ ++ if (!coo) { ++ di_read_lock_child(dentry, AUFS_I_RLOCK); ++ bstart = dbstart(dentry); ++ } else { ++ di_write_lock_child(dentry); ++ bstart = dbstart(dentry); ++ if (test_ro(sb, bstart, dentry->d_inode)) { ++ err = do_coo(dentry, bstart); ++ if (err) { ++ di_write_unlock(dentry); ++ goto out_finfo; ++ } ++ bstart = dbstart(dentry); ++ } ++ di_downgrade_lock(dentry, AUFS_I_RLOCK); ++ } ++ ++ // todo: remove this extra locks ++ dir = dentry->d_parent->d_inode; ++ if (!IS_ROOT(dentry)) ++ ii_read_lock_parent(dir); ++ h_dir = au_h_iptr_i(dir, bstart); ++ hdir_lock(h_dir, dir, bstart); ++ err = open(file, file->f_flags); ++ //if (LktrCond) err = -1; ++ hdir_unlock(h_dir, dir, bstart); ++ if (!IS_ROOT(dentry)) ++ ii_read_unlock(dir); ++ di_read_unlock(dentry, AUFS_I_RLOCK); ++ ++ out_finfo: ++ fi_write_unlock(file); ++ if (unlikely(err)) ++ au_fin_finfo(file); ++ //DbgFile(file); ++ out: ++ si_read_unlock(sb); ++ TraceErr(err); ++ return err; ++} ++ ++int au_reopen_nondir(struct file *file) ++{ ++ int err; ++ struct dentry *dentry; ++ aufs_bindex_t bstart, bindex, bend; ++ struct file *hidden_file, *h_file_tmp; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ DEBUG_ON(S_ISDIR(dentry->d_inode->i_mode) ++ || !au_h_dptr(dentry)->d_inode); ++ bstart = dbstart(dentry); ++ ++ h_file_tmp = NULL; ++ if (fbstart(file) == bstart) { ++ hidden_file = au_h_fptr(file); ++ if (file->f_mode == hidden_file->f_mode) ++ return 0; /* success */ ++ h_file_tmp = hidden_file; ++ get_file(h_file_tmp); ++ set_h_fptr(file, bstart, NULL); ++ } ++ DEBUG_ON(fbstart(file) < bstart ++ || ftofi(file)->fi_hfile[0 + bstart].hf_file); ++ ++ hidden_file = hidden_open(dentry, bstart, file->f_flags & ~O_TRUNC); ++ //if (LktrCond) {fput(hidden_file); br_put(stobr(dentry->d_sb, bstart)); ++ //hidden_file = ERR_PTR(-1);} ++ err = PTR_ERR(hidden_file); ++ if (IS_ERR(hidden_file)) ++ goto out; // close all? ++ err = 0; ++ //cpup_file_flags(hidden_file, file); ++ set_fbstart(file, bstart); ++ set_h_fptr(file, bstart, hidden_file); ++ memcpy(&hidden_file->f_ra, &file->f_ra, sizeof(file->f_ra)); //?? ++ ++ /* close lower files */ ++ bend = fbend(file); ++ for (bindex = bstart + 1; bindex <= bend; bindex++) ++ set_h_fptr(file, bindex, NULL); ++ set_fbend(file, bstart); ++ ++ out: ++ if (h_file_tmp) ++ fput(h_file_tmp); ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * copyup the deleted file for writing. ++ */ ++static int cpup_wh_file(struct file *file, aufs_bindex_t bdst, loff_t len) ++{ ++ int err; ++ struct dentry *dentry, *parent, *hidden_parent, *tmp_dentry; ++ struct dentry *hidden_dentry_bstart, *hidden_dentry_bdst; ++ struct inode *hidden_dir; ++ aufs_bindex_t bstart; ++ struct aufs_dinfo *dinfo; ++ struct dtime dt; ++ struct lkup_args lkup; ++ struct super_block *sb; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, bdst %d, len %Lu\n", DLNPair(dentry), bdst, len); ++ DEBUG_ON(S_ISDIR(dentry->d_inode->i_mode) ++ || !(file->f_mode & FMODE_WRITE)); ++ DiMustWriteLock(dentry); ++ parent = dentry->d_parent; ++ IiMustAnyLock(parent->d_inode); ++ hidden_parent = au_h_dptr_i(parent, bdst); ++ DEBUG_ON(!hidden_parent); ++ hidden_dir = hidden_parent->d_inode; ++ DEBUG_ON(!hidden_dir); ++ IMustLock(hidden_dir); ++ ++ sb = parent->d_sb; ++ lkup.nfsmnt = au_nfsmnt(sb, bdst); ++ lkup.dlgt = need_dlgt(sb); ++ tmp_dentry = lkup_whtmp(hidden_parent, &dentry->d_name, &lkup); ++ //if (LktrCond) {dput(tmp_dentry); tmp_dentry = ERR_PTR(-1);} ++ err = PTR_ERR(tmp_dentry); ++ if (IS_ERR(tmp_dentry)) ++ goto out; ++ ++ dtime_store(&dt, parent, hidden_parent); ++ dinfo = dtodi(dentry); ++ bstart = dinfo->di_bstart; ++ hidden_dentry_bdst = dinfo->di_hdentry[0 + bdst].hd_dentry; ++ hidden_dentry_bstart = dinfo->di_hdentry[0 + bstart].hd_dentry; ++ dinfo->di_bstart = bdst; ++ dinfo->di_hdentry[0 + bdst].hd_dentry = tmp_dentry; ++ dinfo->di_hdentry[0 + bstart].hd_dentry = au_h_fptr(file)->f_dentry; ++ err = cpup_single(dentry, bdst, bstart, len, ++ au_flags_cpup(!CPUP_DTIME, parent)); ++ //if (LktrCond) err = -1; ++ if (!err) ++ err = au_reopen_nondir(file); ++ //err = -1; ++ dinfo->di_hdentry[0 + bstart].hd_dentry = hidden_dentry_bstart; ++ dinfo->di_hdentry[0 + bdst].hd_dentry = hidden_dentry_bdst; ++ dinfo->di_bstart = bstart; ++ if (unlikely(err)) ++ goto out_tmp; ++ ++ DEBUG_ON(!d_unhashed(dentry)); ++ err = vfsub_unlink(hidden_dir, tmp_dentry, lkup.dlgt); ++ //if (LktrCond) err = -1; ++ if (unlikely(err)) { ++ IOErr("failed remove copied-up tmp file %.*s(%d)\n", ++ DLNPair(tmp_dentry), err); ++ err = -EIO; ++ } ++ dtime_revert(&dt, !CPUP_LOCKED_GHDIR); ++ ++ out_tmp: ++ dput(tmp_dentry); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++struct cpup_wh_file_args { ++ int *errp; ++ struct file *file; ++ aufs_bindex_t bdst; ++ loff_t len; ++}; ++ ++static void call_cpup_wh_file(void *args) ++{ ++ struct cpup_wh_file_args *a = args; ++ *a->errp = cpup_wh_file(a->file, a->bdst, a->len); ++} ++ ++/* ++ * prepare the @file for writing. ++ */ ++int au_ready_to_write(struct file *file, loff_t len) ++{ ++ int err; ++ struct dentry *dentry, *parent, *hidden_dentry, *hidden_parent; ++ struct inode *hidden_inode, *hidden_dir, *inode, *dir; ++ struct super_block *sb; ++ aufs_bindex_t bstart, bcpup; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, len %Ld\n", DLNPair(dentry), len); ++ FiMustWriteLock(file); ++ ++ sb = dentry->d_sb; ++ bstart = fbstart(file); ++ DEBUG_ON(ftobr(file, bstart) != stobr(sb, bstart)); ++ ++ inode = dentry->d_inode; ++ ii_read_lock_child(inode); ++ LKTRTrace("rdonly %d, bstart %d\n", test_ro(sb, bstart, inode), bstart); ++ err = test_ro(sb, bstart, inode); ++ ii_read_unlock(inode); ++ if (!err && (au_h_fptr(file)->f_mode & FMODE_WRITE)) ++ return 0; ++ ++ /* need to cpup */ ++ parent = dentry->d_parent; // dget_parent() ++ di_write_lock_child(dentry); ++ di_write_lock_parent(parent); ++ bcpup = err = find_rw_parent_br(dentry, bstart); ++ //bcpup = err = find_rw_br(sb, bstart); ++ if (unlikely(err < 0)) ++ goto out_unlock; ++ err = 0; ++ ++ hidden_parent = au_h_dptr_i(parent, bcpup); ++ if (!hidden_parent) { ++ err = cpup_dirs(dentry, bcpup, NULL); ++ //if (LktrCond) err = -1; ++ if (unlikely(err)) ++ goto out_unlock; ++ hidden_parent = au_h_dptr_i(parent, bcpup); ++ } ++ ++ hidden_dir = hidden_parent->d_inode; ++ hidden_dentry = au_h_fptr(file)->f_dentry; ++ hidden_inode = hidden_dentry->d_inode; ++ dir = parent->d_inode; ++ hdir_lock(hidden_dir, dir, bcpup); ++ hi_lock_child(hidden_inode); ++ if (d_unhashed(dentry) || d_unhashed(hidden_dentry) ++ /* || !hidden_inode->i_nlink */) { ++ if (!au_test_perm(hidden_dir, MAY_EXEC | MAY_WRITE, ++ need_dlgt(sb))) ++ err = cpup_wh_file(file, bcpup, len); ++ else { ++ struct cpup_wh_file_args args = { ++ .errp = &err, ++ .file = file, ++ .bdst = bcpup, ++ .len = len ++ }; ++ au_wkq_wait(call_cpup_wh_file, &args, /*dlgt*/0); ++ } ++ //if (LktrCond) err = -1; ++ TraceErr(err); ++ } else { ++ if (!au_h_dptr_i(dentry, bcpup)) ++ err = sio_cpup_simple(dentry, bcpup, len, ++ au_flags_cpup(CPUP_DTIME, ++ parent)); ++ //if (LktrCond) err = -1; ++ TraceErr(err); ++ if (!err) ++ err = au_reopen_nondir(file); ++ //if (LktrCond) err = -1; ++ TraceErr(err); ++ } ++ i_unlock(hidden_inode); ++ hdir_unlock(hidden_dir, dir, bcpup); ++ ++ out_unlock: ++ di_write_unlock(parent); ++ di_write_unlock(dentry); ++// out: ++ TraceErr(err); ++ return err; ++ ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * after branch manipulating, refresh the file. ++ */ ++static int refresh_file(struct file *file, int (*reopen)(struct file *file)) ++{ ++ int err, new_sz; ++ struct dentry *dentry; ++ aufs_bindex_t bend, bindex, bstart, brid; ++ struct aufs_hfile *p; ++ struct aufs_finfo *finfo; ++ struct super_block *sb; ++ struct inode *inode; ++ struct file *hidden_file; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ FiMustWriteLock(file); ++ DiMustReadLock(dentry); ++ inode = dentry->d_inode; ++ IiMustReadLock(inode); ++ //au_debug_on(); ++ //DbgDentry(dentry); ++ //DbgFile(file); ++ //au_debug_off(); ++ ++ err = -ENOMEM; ++ sb = dentry->d_sb; ++ finfo = ftofi(file); ++ bstart = finfo->fi_bstart; ++ bend = finfo->fi_bstart; ++ new_sz = sizeof(*finfo->fi_hfile) * (sbend(sb) + 1); ++ p = au_kzrealloc(finfo->fi_hfile, sizeof(*p) * (finfo->fi_bend + 1), ++ new_sz, GFP_KERNEL); ++ //p = NULL; ++ if (unlikely(!p)) ++ goto out; ++ finfo->fi_hfile = p; ++ hidden_file = p[0 + bstart].hf_file; ++ ++ p = finfo->fi_hfile + finfo->fi_bstart; ++ brid = p->hf_br->br_id; ++ bend = finfo->fi_bend; ++ for (bindex = finfo->fi_bstart; bindex <= bend; bindex++, p++) { ++ struct aufs_hfile tmp, *q; ++ aufs_bindex_t new_bindex; ++ ++ if (!p->hf_file) ++ continue; ++ new_bindex = find_bindex(sb, p->hf_br); ++ if (new_bindex == bindex) ++ continue; ++ if (new_bindex < 0) { // test here ++ set_h_fptr(file, bindex, NULL); ++ continue; ++ } ++ ++ /* swap two hidden inode, and loop again */ ++ q = finfo->fi_hfile + new_bindex; ++ tmp = *q; ++ *q = *p; ++ *p = tmp; ++ if (tmp.hf_file) { ++ bindex--; ++ p--; ++ } ++ } ++ { ++ aufs_bindex_t s = finfo->fi_bstart, e = finfo->fi_bend; ++ finfo->fi_bstart = 0; ++ finfo->fi_bend = sbend(sb); ++ //au_debug_on(); ++ //DbgFile(file); ++ //au_debug_off(); ++ finfo->fi_bstart = s; ++ finfo->fi_bend = e; ++ } ++ ++ p = finfo->fi_hfile; ++ if (!au_is_mmapped(file) && !d_unhashed(dentry)) { ++ bend = sbend(sb); ++ for (finfo->fi_bstart = 0; finfo->fi_bstart <= bend; ++ finfo->fi_bstart++, p++) ++ if (p->hf_file) { ++ if (p->hf_file->f_dentry ++ && p->hf_file->f_dentry->d_inode) ++ break; ++ else ++ au_hfput(p); ++ } ++ } else { ++ bend = find_brindex(sb, brid); ++ //LKTRTrace("%d\n", bend); ++ for (finfo->fi_bstart = 0; finfo->fi_bstart < bend; ++ finfo->fi_bstart++, p++) ++ if (p->hf_file) ++ au_hfput(p); ++ //LKTRTrace("%d\n", finfo->fi_bstart); ++ bend = sbend(sb); ++ } ++ ++ p = finfo->fi_hfile + bend; ++ for (finfo->fi_bend = bend; finfo->fi_bend >= finfo->fi_bstart; ++ finfo->fi_bend--, p--) ++ if (p->hf_file) { ++ if (p->hf_file->f_dentry ++ && p->hf_file->f_dentry->d_inode) ++ break; ++ else ++ au_hfput(p); ++ } ++ //Dbg("%d, %d\n", finfo->fi_bstart, finfo->fi_bend); ++ DEBUG_ON(finfo->fi_bend < finfo->fi_bstart); ++ //DbgFile(file); ++ //DbgDentry(file->f_dentry); ++ ++ err = 0; ++#if 0 // todo: ++ if (!au_h_dptr(dentry)->d_inode) { ++ au_update_figen(file); ++ goto out; /* success */ ++ } ++#endif ++ ++ if (unlikely(au_is_mmapped(file) || d_unhashed(dentry))) ++ goto out_update; /* success */ ++ ++ again: ++ bstart = ibstart(inode); ++ if (bstart < finfo->fi_bstart ++ && au_flag_test(sb, AuFlag_PLINK) ++ && au_is_plinked(sb, inode)) { ++ struct dentry *parent = dentry->d_parent; // dget_parent() ++ struct inode *dir = parent->d_inode, *h_dir; ++ ++ if (test_ro(sb, bstart, inode)) { ++ di_read_lock_parent(parent, !AUFS_I_RLOCK); ++ bstart = err = find_rw_parent_br(dentry, bstart); ++ //bstart = err = find_rw_br(sb, bstart); ++ di_read_unlock(parent, !AUFS_I_RLOCK); ++ //todo: err = -1; ++ if (unlikely(err < 0)) ++ goto out; ++ } ++ di_read_unlock(dentry, AUFS_I_RLOCK); ++ di_write_lock_child(dentry); ++ if (bstart != ibstart(inode)) { // todo ++ /* someone changed our inode while we were sleeping */ ++ di_downgrade_lock(dentry, AUFS_I_RLOCK); ++ goto again; ++ } ++ ++ di_read_lock_parent(parent, AUFS_I_RLOCK); ++ err = test_and_cpup_dirs(dentry, bstart, NULL); ++ ++ // always superio. ++#if 1 ++ h_dir = au_h_dptr_i(parent, bstart)->d_inode; ++ hdir_lock(h_dir, dir, bstart); ++ err = sio_cpup_simple(dentry, bstart, -1, ++ au_flags_cpup(CPUP_DTIME, parent)); ++ hdir_unlock(h_dir, dir, bstart); ++ di_read_unlock(parent, AUFS_I_RLOCK); ++#else ++ if (!is_au_wkq(current)) { ++ struct cpup_pseudo_link_args args = { ++ .errp = &err, ++ .dentry = dentry, ++ .bdst = bstart, ++ .do_lock = 1 ++ }; ++ au_wkq_wait(call_cpup_pseudo_link, &args); ++ } else ++ err = cpup_pseudo_link(dentry, bstart, /*do_lock*/1); ++#endif ++ di_downgrade_lock(dentry, AUFS_I_RLOCK); ++ if (unlikely(err)) ++ goto out; ++ } ++ ++ err = reopen(file); ++ //err = -1; ++ out_update: ++ if (!err) { ++ au_update_figen(file); ++ //DbgFile(file); ++ return 0; /* success */ ++ } ++ ++ /* error, close all hidden files */ ++ bend = fbend(file); ++ for (bindex = fbstart(file); bindex <= bend; bindex++) ++ set_h_fptr(file, bindex, NULL); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* common function to regular file and dir */ ++int au_reval_and_lock_finfo(struct file *file, int (*reopen)(struct file *file), ++ int wlock, int locked) ++{ ++ int err, sgen, fgen, pseudo_link; ++ struct dentry *dentry; ++ struct super_block *sb; ++ aufs_bindex_t bstart; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, w %d, l %d\n", DLNPair(dentry), wlock, locked); ++ sb = dentry->d_sb; ++ SiMustAnyLock(sb); ++ ++ err = 0; ++ sgen = au_sigen(sb); ++ fi_write_lock(file); ++ fgen = au_figen(file); ++ di_read_lock_child(dentry, AUFS_I_RLOCK); ++ bstart = dbstart(dentry); ++ pseudo_link = (bstart != ibstart(dentry->d_inode)); ++ di_read_unlock(dentry, AUFS_I_RLOCK); ++ if (sgen == fgen && !pseudo_link && fbstart(file) == bstart) { ++ if (!wlock) ++ fi_downgrade_lock(file); ++ return 0; /* success */ ++ } ++ ++ LKTRTrace("sgen %d, fgen %d\n", sgen, fgen); ++ if (sgen != au_digen(dentry)) { ++ /* ++ * d_path() and path_lookup() is a simple and good approach ++ * to revalidate. but si_rwsem in DEBUG_RWSEM will cause a ++ * deadlock. removed the code. ++ */ ++ di_write_lock_child(dentry); ++ err = au_reval_dpath(dentry, sgen); ++ //if (LktrCond) err = -1; ++ di_write_unlock(dentry); ++ if (unlikely(err < 0)) ++ goto out; ++ DEBUG_ON(au_digen(dentry) != sgen); ++ } ++ ++ di_read_lock_child(dentry, AUFS_I_RLOCK); ++ err = refresh_file(file, reopen); ++ //if (LktrCond) err = -1; ++ di_read_unlock(dentry, AUFS_I_RLOCK); ++ if (!err) { ++ if (!wlock) ++ fi_downgrade_lock(file); ++ } else ++ fi_write_unlock(file); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++// cf. aufs_nopage() ++// for madvise(2) ++static int aufs_readpage(struct file *file, struct page *page) ++{ ++ TraceEnter(); ++ unlock_page(page); ++ return 0; ++} ++ ++// they will never be called. ++#ifdef CONFIG_AUFS_DEBUG ++static int aufs_prepare_write(struct file *file, struct page *page, ++ unsigned from, unsigned to) ++{BUG();return 0;} ++static int aufs_commit_write(struct file *file, struct page *page, ++ unsigned from, unsigned to) ++{BUG();return 0;} ++static int aufs_writepage(struct page *page, struct writeback_control *wbc) ++{BUG();return 0;} ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,17) ++static void aufs_sync_page(struct page *page) ++{BUG();} ++#else ++static int aufs_sync_page(struct page *page) ++{BUG(); return 0;} ++#endif ++ ++#if 0 // comment ++static int aufs_writepages(struct address_space *mapping, ++ struct writeback_control *wbc) ++{BUG();return 0;} ++static int aufs_readpages(struct file *filp, struct address_space *mapping, ++ struct list_head *pages, unsigned nr_pages) ++{BUG();return 0;} ++static sector_t aufs_bmap(struct address_space *mapping, sector_t block) ++{BUG();return 0;} ++#endif ++ ++static int aufs_set_page_dirty(struct page *page) ++{BUG();return 0;} ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,17) ++static void aufs_invalidatepage (struct page *page, unsigned long offset) ++{BUG();} ++#else ++static int aufs_invalidatepage (struct page *page, unsigned long offset) ++{BUG(); return 0;} ++#endif ++static int aufs_releasepage (struct page *page, gfp_t gfp) ++{BUG();return 0;} ++static ssize_t aufs_direct_IO(int rw, struct kiocb *iocb, ++ const struct iovec *iov, loff_t offset, ++ unsigned long nr_segs) ++{BUG();return 0;} ++static struct page* aufs_get_xip_page(struct address_space *mapping, ++ sector_t offset, int create) ++{BUG();return NULL;} ++//static int aufs_migratepage (struct page *newpage, struct page *page) ++//{BUG();return 0;} ++#endif ++ ++#if 0 // comment ++struct address_space { ++ struct inode *host; /* owner: inode, block_device */ ++ struct radix_tree_root page_tree; /* radix tree of all pages */ ++ rwlock_t tree_lock; /* and rwlock protecting it */ ++ unsigned int i_mmap_writable;/* count VM_SHARED mappings */ ++ struct prio_tree_root i_mmap; /* tree of private and shared mappings */ ++ struct list_head i_mmap_nonlinear;/*list VM_NONLINEAR mappings */ ++ spinlock_t i_mmap_lock; /* protect tree, count, list */ ++ unsigned int truncate_count; /* Cover race condition with truncate */ ++ unsigned long nrpages; /* number of total pages */ ++ pgoff_t writeback_index;/* writeback starts here */ ++ struct address_space_operations *a_ops; /* methods */ ++ unsigned long flags; /* error bits/gfp mask */ ++ struct backing_dev_info *backing_dev_info; /* device readahead, etc */ ++ spinlock_t private_lock; /* for use by the address_space */ ++ struct list_head private_list; /* ditto */ ++ struct address_space *assoc_mapping; /* ditto */ ++} __attribute__((aligned(sizeof(long)))); ++ ++struct address_space_operations { ++ int (*writepage)(struct page *page, struct writeback_control *wbc); ++ int (*readpage)(struct file *, struct page *); ++ void (*sync_page)(struct page *); ++ ++ /* Write back some dirty pages from this mapping. */ ++ int (*writepages)(struct address_space *, struct writeback_control *); ++ ++ /* Set a page dirty. Return true if this dirtied it */ ++ int (*set_page_dirty)(struct page *page); ++ ++ int (*readpages)(struct file *filp, struct address_space *mapping, ++ struct list_head *pages, unsigned nr_pages); ++ ++ /* ++ * ext3 requires that a successful prepare_write() call be followed ++ * by a commit_write() call - they must be balanced ++ */ ++ int (*prepare_write)(struct file *, struct page *, unsigned, unsigned); ++ int (*commit_write)(struct file *, struct page *, unsigned, unsigned); ++ /* Unfortunately this kludge is needed for FIBMAP. Don't use it */ ++ sector_t (*bmap)(struct address_space *, sector_t); ++ void (*invalidatepage) (struct page *, unsigned long); ++ int (*releasepage) (struct page *, gfp_t); ++ ssize_t (*direct_IO)(int, struct kiocb *, const struct iovec *iov, ++ loff_t offset, unsigned long nr_segs); ++ struct page* (*get_xip_page)(struct address_space *, sector_t, ++ int); ++ /* migrate the contents of a page to the specified target */ ++ int (*migratepage) (struct page *, struct page *); ++}; ++#endif ++ ++struct address_space_operations aufs_aop = { ++ .readpage = aufs_readpage, ++#ifdef CONFIG_AUFS_DEBUG ++ .writepage = aufs_writepage, ++ .sync_page = aufs_sync_page, ++ //.writepages = aufs_writepages, ++ .set_page_dirty = aufs_set_page_dirty, ++ //.readpages = aufs_readpages, ++ .prepare_write = aufs_prepare_write, ++ .commit_write = aufs_commit_write, ++ //.bmap = aufs_bmap, ++ .invalidatepage = aufs_invalidatepage, ++ .releasepage = aufs_releasepage, ++ .direct_IO = aufs_direct_IO, ++ .get_xip_page = aufs_get_xip_page, ++ //.migratepage = aufs_migratepage ++#endif ++}; +diff --git a/fs/aufs/file.h b/fs/aufs/file.h +new file mode 100755 +index 0000000..f0fa448 +--- /dev/null ++++ b/fs/aufs/file.h +@@ -0,0 +1,140 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: file.h,v 1.25 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_FILE_H__ ++#define __AUFS_FILE_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/file.h> ++#include <linux/fs.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++#include "misc.h" ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++// SEEK_xxx are defined in linux/fs.h ++#else ++enum {SEEK_SET, SEEK_CUR, SEEK_END}; ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct aufs_branch; ++struct aufs_hfile { ++ struct file *hf_file; ++ struct aufs_branch *hf_br; ++}; ++ ++struct aufs_vdir; ++struct aufs_finfo { ++ atomic_t fi_generation; ++ ++ struct aufs_rwsem fi_rwsem; ++ struct aufs_hfile *fi_hfile; ++ aufs_bindex_t fi_bstart, fi_bend; ++ ++ union { ++ struct vm_operations_struct *fi_h_vm_ops; ++ struct aufs_vdir *fi_vdir_cache; ++ }; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* file.c */ ++extern struct address_space_operations aufs_aop; ++unsigned int au_file_roflags(unsigned int flags); ++struct file *hidden_open(struct dentry *dentry, aufs_bindex_t bindex, ++ int flags); ++int au_do_open(struct inode *inode, struct file *file, ++ int (*open)(struct file *file, int flags)); ++int au_reopen_nondir(struct file *file); ++int au_ready_to_write(struct file *file, loff_t len); ++int au_reval_and_lock_finfo(struct file *file, int (*reopen)(struct file *file), ++ int wlock, int locked); ++ ++/* f_op.c */ ++extern struct file_operations aufs_file_fop; ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++int aufs_flush(struct file *file, fl_owner_t id); ++#else ++int aufs_flush(struct file *file); ++#endif ++ ++/* finfo.c */ ++struct aufs_finfo *ftofi(struct file *file); ++aufs_bindex_t fbstart(struct file *file); ++aufs_bindex_t fbend(struct file *file); ++struct aufs_vdir *fvdir_cache(struct file *file); ++struct aufs_branch *ftobr(struct file *file, aufs_bindex_t bindex); ++struct file *au_h_fptr_i(struct file *file, aufs_bindex_t bindex); ++struct file *au_h_fptr(struct file *file); ++ ++void set_fbstart(struct file *file, aufs_bindex_t bindex); ++void set_fbend(struct file *file, aufs_bindex_t bindex); ++void set_fvdir_cache(struct file *file, struct aufs_vdir *vdir_cache); ++void au_hfput(struct aufs_hfile *hf); ++void set_h_fptr(struct file *file, aufs_bindex_t bindex, struct file *h_file); ++void au_update_figen(struct file *file); ++ ++void au_fin_finfo(struct file *file); ++int au_init_finfo(struct file *file); ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline int au_figen(struct file *f) ++{ ++ return atomic_read(&ftofi(f)->fi_generation); ++} ++ ++static inline int au_is_mmapped(struct file *f) ++{ ++ return !!(ftofi(f)->fi_h_vm_ops); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * fi_read_lock, fi_write_lock, ++ * fi_read_unlock, fi_write_unlock, fi_downgrade_lock ++ */ ++SimpleRwsemFuncs(fi, struct file *f, ftofi(f)->fi_rwsem); ++ ++/* to debug easier, do not make them inlined functions */ ++#define FiMustReadLock(f) do {\ ++ SiMustAnyLock((f)->f_dentry->d_sb); \ ++ RwMustReadLock(&ftofi(f)->fi_rwsem); \ ++} while (0) ++ ++#define FiMustWriteLock(f) do { \ ++ SiMustAnyLock((f)->f_dentry->d_sb); \ ++ RwMustWriteLock(&ftofi(f)->fi_rwsem); \ ++} while (0) ++ ++#define FiMustAnyLock(f) do { \ ++ SiMustAnyLock((f)->f_dentry->d_sb); \ ++ RwMustAnyLock(&ftofi(f)->fi_rwsem); \ ++} while (0) ++ ++#define FiMustNoWaiters(f) RwMustNoWaiters(&ftofi(f)->fi_rwsem) ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_FILE_H__ */ +diff --git a/fs/aufs/finfo.c b/fs/aufs/finfo.c +new file mode 100755 +index 0000000..1e09da8 +--- /dev/null ++++ b/fs/aufs/finfo.c +@@ -0,0 +1,211 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: finfo.c,v 1.23 2007/04/30 05:45:21 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++struct aufs_finfo *ftofi(struct file *file) ++{ ++ struct aufs_finfo *finfo = file->private_data; ++ DEBUG_ON(!finfo ++ || !finfo->fi_hfile ++ || (0 < finfo->fi_bend ++ && (/* stosi(file->f_dentry->d_sb)->si_bend ++ < finfo->fi_bend ++ || */ finfo->fi_bend < finfo->fi_bstart))); ++ return finfo; ++} ++ ++// hard/soft set ++aufs_bindex_t fbstart(struct file *file) ++{ ++ FiMustAnyLock(file); ++ return ftofi(file)->fi_bstart; ++} ++ ++aufs_bindex_t fbend(struct file *file) ++{ ++ FiMustAnyLock(file); ++ return ftofi(file)->fi_bend; ++} ++ ++struct aufs_vdir *fvdir_cache(struct file *file) ++{ ++ FiMustAnyLock(file); ++ return ftofi(file)->fi_vdir_cache; ++} ++ ++struct aufs_branch *ftobr(struct file *file, aufs_bindex_t bindex) ++{ ++ struct aufs_finfo *finfo = ftofi(file); ++ struct aufs_hfile *hf; ++ ++ FiMustAnyLock(file); ++ DEBUG_ON(!finfo ++ || finfo->fi_bstart < 0 ++ || bindex < finfo->fi_bstart ++ || finfo->fi_bend < bindex); ++ hf = finfo->fi_hfile + bindex; ++ DEBUG_ON(hf->hf_br && br_count(hf->hf_br) <= 0); ++ return hf->hf_br; ++} ++ ++struct file *au_h_fptr_i(struct file *file, aufs_bindex_t bindex) ++{ ++ struct aufs_finfo *finfo = ftofi(file); ++ struct aufs_hfile *hf; ++ ++ FiMustAnyLock(file); ++ DEBUG_ON(!finfo ++ || finfo->fi_bstart < 0 ++ || bindex < finfo->fi_bstart ++ || finfo->fi_bend < bindex); ++ hf = finfo->fi_hfile + bindex; ++ DEBUG_ON(hf->hf_file ++ && file_count(hf->hf_file) <= 0 ++ && br_count(hf->hf_br) <= 0); ++ return hf->hf_file; ++} ++ ++struct file *au_h_fptr(struct file *file) ++{ ++ return au_h_fptr_i(file, fbstart(file)); ++} ++ ++void set_fbstart(struct file *file, aufs_bindex_t bindex) ++{ ++ FiMustWriteLock(file); ++ DEBUG_ON(sbend(file->f_dentry->d_sb) < bindex); ++ ftofi(file)->fi_bstart = bindex; ++} ++ ++void set_fbend(struct file *file, aufs_bindex_t bindex) ++{ ++ FiMustWriteLock(file); ++ DEBUG_ON(sbend(file->f_dentry->d_sb) < bindex ++ || bindex < fbstart(file)); ++ ftofi(file)->fi_bend = bindex; ++} ++ ++void set_fvdir_cache(struct file *file, struct aufs_vdir *vdir_cache) ++{ ++ FiMustWriteLock(file); ++ DEBUG_ON(!S_ISDIR(file->f_dentry->d_inode->i_mode) ++ || (ftofi(file)->fi_vdir_cache && vdir_cache)); ++ ftofi(file)->fi_vdir_cache = vdir_cache; ++} ++ ++void au_hfput(struct aufs_hfile *hf) ++{ ++ fput(hf->hf_file); ++ hf->hf_file = NULL; ++ DEBUG_ON(!hf->hf_br); ++ br_put(hf->hf_br); ++ hf->hf_br = NULL; ++} ++ ++void set_h_fptr(struct file *file, aufs_bindex_t bindex, struct file *val) ++{ ++ struct aufs_finfo *finfo = ftofi(file); ++ struct aufs_hfile *hf; ++ ++ FiMustWriteLock(file); ++ DEBUG_ON(!finfo ++ || finfo->fi_bstart < 0 ++ || bindex < finfo->fi_bstart ++ || finfo->fi_bend < bindex); ++ DEBUG_ON(val && file_count(val) <= 0); ++ hf = finfo->fi_hfile + bindex; ++ DEBUG_ON(val && hf->hf_file); ++ if (hf->hf_file) ++ au_hfput(hf); ++ if (val) { ++ hf->hf_file = val; ++ hf->hf_br = stobr(file->f_dentry->d_sb, bindex); ++ } ++} ++ ++void au_update_figen(struct file *file) ++{ ++ atomic_set(&ftofi(file)->fi_generation, au_digen(file->f_dentry)); ++} ++ ++void au_fin_finfo(struct file *file) ++{ ++ struct aufs_finfo *finfo; ++ struct dentry *dentry; ++ aufs_bindex_t bindex, bend; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ SiMustAnyLock(dentry->d_sb); ++ ++ fi_write_lock(file); ++ bend = fbend(file); ++ bindex = fbstart(file); ++ if (bindex >= 0) ++ for (; bindex <= bend; bindex++) ++ set_h_fptr(file, bindex, NULL); ++ ++ finfo = ftofi(file); ++#ifdef CONFIG_AUFS_DEBUG ++ if (finfo->fi_bstart >= 0) { ++ bend = fbend(file); ++ for (bindex = finfo->fi_bstart; bindex <= bend; bindex++) { ++ struct aufs_hfile *hf; ++ hf = finfo->fi_hfile + bindex; ++ DEBUG_ON(hf->hf_file || hf->hf_br); ++ } ++ } ++#endif ++ ++ kfree(finfo->fi_hfile); ++ fi_write_unlock(file); ++ cache_free_finfo(finfo); ++ //file->private_data = NULL; ++} ++ ++int au_init_finfo(struct file *file) ++{ ++ struct aufs_finfo *finfo; ++ struct dentry *dentry; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ DEBUG_ON(!dentry->d_inode); ++ ++ finfo = cache_alloc_finfo(); ++ if (finfo) { ++ finfo->fi_hfile = kcalloc(sbend(dentry->d_sb) + 1, ++ sizeof(*finfo->fi_hfile), GFP_KERNEL); ++ if (finfo->fi_hfile) { ++ rw_init_wlock(&finfo->fi_rwsem); ++ finfo->fi_bstart = -1; ++ finfo->fi_bend = -1; ++ atomic_set(&finfo->fi_generation, au_digen(dentry)); ++ ++ file->private_data = finfo; ++ return 0; /* success */ ++ } ++ cache_free_finfo(finfo); ++ } ++ ++ TraceErr(-ENOMEM); ++ return -ENOMEM; ++} +diff --git a/fs/aufs/hinotify.c b/fs/aufs/hinotify.c +new file mode 100755 +index 0000000..3bad3f7 +--- /dev/null ++++ b/fs/aufs/hinotify.c +@@ -0,0 +1,536 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: hinotify.c,v 1.19 2007/05/14 03:39:21 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++static struct inotify_handle *in_handle; ++static const __u32 in_mask = (IN_MOVE | IN_DELETE | IN_CREATE /* | IN_ACCESS */ ++ | IN_MODIFY | IN_ATTRIB ++ | IN_DELETE_SELF | IN_MOVE_SELF); ++ ++int alloc_hinotify(struct aufs_hinode *hinode, struct inode *inode, ++ struct inode *hidden_inode) ++{ ++ int err; ++ struct aufs_hinotify *hin; ++ s32 wd; ++ ++ LKTRTrace("i%lu, hi%lu\n", inode->i_ino, hidden_inode->i_ino); ++ ++ err = -ENOMEM; ++ hin = cache_alloc_hinotify(); ++ if (hin) { ++ DEBUG_ON(hinode->hi_notify); ++ hinode->hi_notify = hin; ++ hin->hin_aufs_inode = inode; ++ inotify_init_watch(&hin->hin_watch); ++ wd = inotify_add_watch(in_handle, &hin->hin_watch, hidden_inode, ++ in_mask); ++ if (wd >= 0) ++ return 0; /* success */ ++ ++ err = wd; ++ put_inotify_watch(&hin->hin_watch); ++ cache_free_hinotify(hin); ++ hinode->hi_notify = NULL; ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++void do_free_hinotify(struct aufs_hinode *hinode) ++{ ++ int err; ++ struct aufs_hinotify *hin; ++ ++ TraceEnter(); ++ ++ hin = hinode->hi_notify; ++ if (hin) { ++ err = 0; ++ if (atomic_read(&hin->hin_watch.count)) ++ err = inotify_rm_watch(in_handle, &hin->hin_watch); ++ ++ if (!err) { ++ cache_free_hinotify(hin); ++ hinode->hi_notify = NULL; ++ } else ++ IOErr1("failed inotify_rm_watch() %d\n", err); ++ } ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static void ctl_hinotify(struct aufs_hinode *hinode, const __u32 mask) ++{ ++ struct inode *hi; ++ struct inotify_watch *watch; ++ ++ hi = hinode->hi_inode; ++ LKTRTrace("hi%lu, sb %p, 0x%x\n", hi->i_ino, hi->i_sb, mask); ++ if (0 && !strcmp(current->comm, "link")) ++ dump_stack(); ++ IMustLock(hi); ++ if (!hinode->hi_notify) ++ return; ++ ++ watch = &hinode->hi_notify->hin_watch; ++#if 0 ++ { ++ u32 wd; ++ wd = inotify_find_update_watch(in_handle, hi, mask); ++ TraceErr(wd); ++ // ignore an err; ++ } ++#else ++ watch->mask = mask; ++ smp_mb(); ++#endif ++ LKTRTrace("watch %p, mask %u\n", watch, watch->mask); ++} ++ ++#define suspend_hinotify(hi) ctl_hinotify(hi, 0) ++#define resume_hinotify(hi) ctl_hinotify(hi, in_mask) ++ ++void do_hdir_lock(struct inode *h_dir, struct inode *dir, aufs_bindex_t bindex, ++ unsigned int lsc) ++{ ++ struct aufs_hinode *hinode; ++ ++ LKTRTrace("i%lu, b%d, lsc %d\n", dir->i_ino, bindex, lsc); ++ DEBUG_ON(!S_ISDIR(dir->i_mode)); ++ hinode = itoii(dir)->ii_hinode + bindex; ++ DEBUG_ON(h_dir != hinode->hi_inode); ++ ++ hi_lock(h_dir, lsc); ++ if (1 /* unlikely(au_flag_test(dir->i_sb, AuFlag_UDBA_HINOTIFY) */) ++ suspend_hinotify(hinode); ++} ++ ++void hdir_unlock(struct inode *h_dir, struct inode *dir, aufs_bindex_t bindex) ++{ ++ struct aufs_hinode *hinode; ++ ++ LKTRTrace("i%lu, b%d\n", dir->i_ino, bindex); ++ DEBUG_ON(!S_ISDIR(dir->i_mode)); ++ hinode = itoii(dir)->ii_hinode + bindex; ++ DEBUG_ON(h_dir != hinode->hi_inode); ++ ++ if (1 /* unlikely(au_flag_test(dir->i_sb, AuFlag_UDBA_HINOTIFY) */) ++ resume_hinotify(hinode); ++ i_unlock(h_dir); ++} ++ ++void hdir_lock_rename(struct dentry **h_parents, struct inode **dirs, ++ aufs_bindex_t bindex, int issamedir) ++{ ++ struct aufs_hinode *hinode; ++ ++ LKTRTrace("%.*s, %.*s\n", DLNPair(h_parents[0]), DLNPair(h_parents[1])); ++ ++ vfsub_lock_rename(h_parents[0], h_parents[1]); ++ hinode = itoii(dirs[0])->ii_hinode + bindex; ++ DEBUG_ON(h_parents[0]->d_inode != hinode->hi_inode); ++ suspend_hinotify(hinode); ++ if (issamedir) ++ return; ++ hinode = itoii(dirs[1])->ii_hinode + bindex; ++ DEBUG_ON(h_parents[1]->d_inode != hinode->hi_inode); ++ suspend_hinotify(hinode); ++} ++ ++void hdir_unlock_rename(struct dentry **h_parents, struct inode **dirs, ++ aufs_bindex_t bindex, int issamedir) ++{ ++ struct aufs_hinode *hinode; ++ ++ LKTRTrace("%.*s, %.*s\n", DLNPair(h_parents[0]), DLNPair(h_parents[1])); ++ ++ hinode = itoii(dirs[0])->ii_hinode + bindex; ++ DEBUG_ON(h_parents[0]->d_inode != hinode->hi_inode); ++ resume_hinotify(hinode); ++ if (!issamedir) { ++ hinode = itoii(dirs[1])->ii_hinode + bindex; ++ DEBUG_ON(h_parents[1]->d_inode != hinode->hi_inode); ++ resume_hinotify(hinode); ++ } ++ vfsub_unlock_rename(h_parents[0], h_parents[1]); ++} ++ ++void au_reset_hinotify(struct inode *inode, unsigned int flags) ++{ ++ aufs_bindex_t bindex, bend; ++ struct inode *hi; ++ ++ LKTRTrace("i%lu, 0x%x\n", inode->i_ino, flags); ++ ++ bend = ibend(inode); ++ for (bindex = ibstart(inode); bindex <= bend; bindex++) { ++ hi = au_h_iptr_i(inode, bindex); ++ if (hi) { ++ //hi_lock(hi, AUFS_LSC_H_CHILD); ++ igrab(hi); ++ set_h_iptr(inode, bindex, NULL, 0); ++ set_h_iptr(inode, bindex, igrab(hi), flags); ++ iput(hi); ++ //i_unlock(hi); ++ } ++ } ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_DEBUG ++static char *in_name(u32 mask) ++{ ++#define test_ret(flag) if (mask & flag) return #flag; ++ test_ret(IN_ACCESS); ++ test_ret(IN_MODIFY); ++ test_ret(IN_ATTRIB); ++ test_ret(IN_CLOSE_WRITE); ++ test_ret(IN_CLOSE_NOWRITE); ++ test_ret(IN_OPEN); ++ test_ret(IN_MOVED_FROM); ++ test_ret(IN_MOVED_TO); ++ test_ret(IN_CREATE); ++ test_ret(IN_DELETE); ++ test_ret(IN_DELETE_SELF); ++ test_ret(IN_MOVE_SELF); ++ test_ret(IN_UNMOUNT); ++ test_ret(IN_Q_OVERFLOW); ++ test_ret(IN_IGNORED); ++ return ""; ++#undef test_ret ++} ++#else ++#define in_name(m) "??" ++#endif ++ ++static int dec_gen_by_name(struct inode *dir, const char *_name, u32 mask) ++{ ++ int err; ++ struct dentry *parent, *child; ++ struct inode *inode; ++ struct qstr *dname; ++ char *name = (void*)_name; ++ unsigned int len; ++ ++ LKTRTrace("i%lu, %s, 0x%x %s\n", ++ dir->i_ino, name, mask, in_name(mask)); ++ ++ err = -1; ++ parent = d_find_alias(dir); ++ if (unlikely(!parent)) ++ goto out; ++ ++#if 0 ++ if (unlikely(!memcmp(name, AUFS_WH_PFX, AUFS_WH_PFX_LEN))) ++ name += AUFS_WH_PFX_LEN; ++#endif ++ len = strlen(name); ++ spin_lock(&dcache_lock); ++ list_for_each_entry(child, &parent->d_subdirs, d_u.d_child) { ++ dname = &child->d_name; ++ if (len == dname->len && !memcmp(dname->name, name, len)) { ++ au_digen_dec(child); ++#if 1 ++ //todo: why both are needed ++ if (mask & IN_MOVE) { ++ spin_lock(&child->d_lock); ++ __d_drop(child); ++ spin_unlock(&child->d_lock); ++ } ++#endif ++ ++ inode = child->d_inode; ++ if (inode) ++ au_iigen_dec(inode); ++ err = !!inode; ++ ++ // todo: the i_nlink of newly created name by link(2) ++ // should be updated ++ // todo: some nfs dentry doesn't notified at deleteing ++ break; ++ } ++ } ++ spin_unlock(&dcache_lock); ++ dput(parent); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++struct postproc_args { ++ struct inode *h_dir, *dir, *h_child_inode; ++ char *h_child_name; ++ u32 mask; ++}; ++ ++static void dec_gen_by_ino(struct postproc_args *a) ++{ ++ struct super_block *sb; ++ aufs_bindex_t bindex, bend, bfound; ++ struct xino xino; ++ struct inode *cinode; ++ ++ TraceEnter(); ++ ++ sb = a->dir->i_sb; ++ DEBUG_ON(!au_flag_test(sb, AuFlag_XINO)); ++ ++ bfound = -1; ++ bend = ibend(a->dir); ++ for (bindex = ibstart(a->dir); bfound == -1 && bindex <= bend; bindex++) ++ if (au_h_iptr_i(a->dir, bindex) == a->h_dir) ++ bfound = bindex; ++ if (bfound < 0) ++ return; ++ ++ bindex = find_brindex(sb, itoii(a->dir)->ii_hinode[bfound + 0].hi_id); ++ if (bindex < 0) ++ return; ++ if (unlikely(xino_read(sb, bindex, a->h_child_inode->i_ino, &xino))) ++ return; ++ cinode = NULL; ++ if (xino.ino) ++ cinode = ilookup(sb, xino.ino); ++ if (cinode) { ++#if 1 ++ if (1 || a->mask & IN_MOVE) { ++ struct dentry *child; ++ spin_lock(&dcache_lock); ++ list_for_each_entry(child, &cinode->i_dentry, d_alias) ++ au_digen_dec(child); ++ spin_unlock(&dcache_lock); ++ } ++#endif ++ au_iigen_dec(cinode); ++ iput(cinode); ++ } ++} ++ ++static void reset_ino(struct postproc_args *a) ++{ ++ aufs_bindex_t bindex, bend; ++ struct super_block *sb; ++ struct inode *h_dir; ++ ++ sb = a->dir->i_sb; ++ bend = ibend(a->dir); ++ for (bindex = ibstart(a->dir); bindex <= bend; bindex++) { ++ h_dir = au_h_iptr_i(a->dir, bindex); ++ if (h_dir && h_dir != a->h_dir) ++ xino_write0(sb, bindex, h_dir->i_ino); ++ /* ignore this error */ ++ } ++} ++ ++static void postproc(void *args) ++{ ++ struct postproc_args *a = args; ++ struct super_block *sb; ++ struct aufs_vdir *vdir; ++ ++ //au_debug_on(); ++ LKTRTrace("mask 0x%x %s, i%lu, hi%lu, hci%lu\n", ++ a->mask, in_name(a->mask), a->dir->i_ino, a->h_dir->i_ino, ++ a->h_child_inode ? a->h_child_inode->i_ino : 0); ++ DEBUG_ON(!a->dir); ++#if 0//def ForceInotify ++ Dbg("mask 0x%x %s, i%lu, hi%lu, hci%lu\n", ++ a->mask, in_name(a->mask), a->dir->i_ino, a->h_dir->i_ino, ++ a->h_child_inode ? a->h_child_inode->i_ino : 0); ++#endif ++ ++ i_lock(a->dir); ++ sb = a->dir->i_sb; ++ si_read_lock(sb); // consider write_lock ++ ii_write_lock_parent(a->dir); ++ ++ /* make dir entries obsolete */ ++ vdir = ivdir(a->dir); ++ if (vdir) ++ vdir->vd_jiffy = 0; ++ a->dir->i_version++; ++ ++ /* ++ * special handling root directory, ++ * sine d_revalidate may not be called later. ++ * main purpose is maintaining i_nlink. ++ */ ++ if (unlikely(a->dir->i_ino == AUFS_ROOT_INO)) ++ au_cpup_attr_all(a->dir); ++ ++ if (a->h_child_inode && au_flag_test(sb, AuFlag_XINO)) ++ dec_gen_by_ino(a); ++ else if (a->mask & (IN_MOVE_SELF | IN_DELETE_SELF)) ++ reset_ino(a); ++ ++ ii_write_unlock(a->dir); ++ si_read_unlock(sb); ++ i_unlock(a->dir); ++ ++ au_mntput(a->dir->i_sb); ++ iput(a->h_child_inode); ++ iput(a->h_dir); ++ iput(a->dir); ++#if 0 ++ if (atomic_dec_and_test(&stosi(sb)->si_hinotify)) ++ wake_up_all(&stosi(sb)->si_hinotify_wq); ++#endif ++ kfree(a); ++ //au_debug_off(); ++} ++ ++static void aufs_inotify(struct inotify_watch *watch, u32 wd, u32 mask, ++ u32 cookie, const char *h_child_name, ++ struct inode *h_child_inode) ++{ ++ struct aufs_hinotify *hinotify; ++ struct postproc_args *args; ++ int len; ++ char *p; ++ struct inode *dir; ++ //static DECLARE_WAIT_QUEUE_HEAD(wq); ++ ++ //au_debug_on(); ++ LKTRTrace("i%lu, wd %d, mask 0x%x %s, cookie 0x%x, hcname %s, hi%lu\n", ++ watch->inode->i_ino, wd, mask, in_name(mask), cookie, ++ h_child_name ? h_child_name : "", ++ h_child_inode ? h_child_inode->i_ino : 0); ++ //au_debug_off(); ++ //IMustLock(h_dir); ++#if 0 //defined(ForceInotify) || defined(DbgInotify) ++ Dbg("i%lu, wd %d, mask 0x%x %s, cookie 0x%x, hcname %s, hi%lu\n", ++ watch->inode->i_ino, wd, mask, in_name(mask), cookie, ++ h_child_name ? h_child_name : "", ++ h_child_inode ? h_child_inode->i_ino : 0); ++#endif ++ /* if IN_UNMOUNT happens, there must be another bug */ ++ if (mask & (IN_IGNORED | IN_UNMOUNT)) { ++ put_inotify_watch(watch); ++ return; ++ } ++ ++ switch (mask & IN_ALL_EVENTS) { ++ case IN_MODIFY: ++ case IN_ATTRIB: ++ if (h_child_name) ++ return; ++ break; ++ ++ case IN_MOVED_FROM: ++ case IN_MOVED_TO: ++ case IN_CREATE: ++ DEBUG_ON(!h_child_name || !h_child_inode); ++ break; ++ case IN_DELETE: ++ /* ++ * aufs never be able to get this child inode. ++ * revalidation should be in d_revalide() ++ * by checking i_nlink, i_generation or d_unhashed(). ++ */ ++ DEBUG_ON(!h_child_name); ++ break; ++ ++ case IN_DELETE_SELF: ++ case IN_MOVE_SELF: ++ DEBUG_ON(h_child_name || h_child_inode); ++ break; ++ ++ case IN_ACCESS: ++ default: ++ DEBUG_ON(1); ++ } ++ ++#ifdef DbgInotify ++ WARN_ON(1); ++#endif ++ ++ /* iput() will be called in postproc() */ ++ hinotify = container_of(watch, struct aufs_hinotify, hin_watch); ++ DEBUG_ON(!hinotify || !hinotify->hin_aufs_inode); ++ dir = hinotify->hin_aufs_inode; ++ ++ /* force re-lookup in next d_revalidate() */ ++ if (dir->i_ino != AUFS_ROOT_INO) ++ au_iigen_dec(dir); ++ len = 0; ++ if (h_child_name && dec_gen_by_name(dir, h_child_name, mask)) ++ len = strlen(h_child_name); ++ ++ //wait_event(wq, (args = kmalloc(sizeof(*args), GFP_KERNEL))); ++ args = kmalloc(sizeof(*args) + len + 1, GFP_KERNEL); ++ if (unlikely(!args)) { ++ Err("no memory\n"); ++ return; ++ } ++ args->mask = mask; ++ args->dir = igrab(dir); ++ args->h_dir = igrab(watch->inode); ++ args->h_child_inode = NULL; ++ if (len) { ++ if (h_child_inode) ++ args->h_child_inode = igrab(h_child_inode); ++ p = (void*)args; ++ args->h_child_name = p + sizeof(*args); ++ memcpy(args->h_child_name, h_child_name, len + 1); ++ } ++ //atomic_inc(&stosi(args->dir->i_sb)->si_hinotify); ++ /* prohibit umount */ ++ au_mntget(args->dir->i_sb); ++ au_wkq_nowait(postproc, args, /*dlgt*/0); ++} ++ ++#if 0 ++void hinotify_flush(struct super_block *sb) ++{ ++ atomic_t *p = &stosi(sb)->si_hinotify; ++ wait_event(stosi(sb)->si_hinotify_wq, !atomic_read(p)); ++} ++#endif ++ ++static void aufs_inotify_destroy(struct inotify_watch *watch) ++{ ++ return; ++} ++ ++static struct inotify_operations aufs_inotify_ops = { ++ .handle_event = aufs_inotify, ++ .destroy_watch = aufs_inotify_destroy ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++int __init au_inotify_init(void) ++{ ++ in_handle = inotify_init(&aufs_inotify_ops); ++ if (!IS_ERR(in_handle)) ++ return 0; ++ TraceErrPtr(in_handle); ++ return PTR_ERR(in_handle); ++} ++ ++void au_inotify_fin(void) ++{ ++ inotify_destroy(in_handle); ++} +diff --git a/fs/aufs/i_op.c b/fs/aufs/i_op.c +new file mode 100755 +index 0000000..1cd0453 +--- /dev/null ++++ b/fs/aufs/i_op.c +@@ -0,0 +1,641 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: i_op.c,v 1.30 2007/04/23 00:55:05 sfjro Exp $ */ ++ ++//#include <linux/fs.h> ++//#include <linux/namei.h> ++#include <linux/security.h> ++#include <asm/uaccess.h> ++#include "aufs.h" ++ ++#ifdef CONFIG_AUFS_DLGT ++struct security_inode_permission_args { ++ int *errp; ++ struct inode *h_inode; ++ int mask; ++ struct nameidata *fake_nd; ++}; ++ ++static void call_security_inode_permission(void *args) ++{ ++ struct security_inode_permission_args *a = args; ++ LKTRTrace("fsuid %d\n", current->fsuid); ++ *a->errp = security_inode_permission(a->h_inode, a->mask, a->fake_nd); ++} ++#endif ++ ++static int hidden_permission(struct inode *hidden_inode, int mask, ++ struct nameidata *fake_nd, int brperm, int dlgt) ++{ ++ int err, submask; ++ const int write_mask = (mask & (MAY_WRITE | MAY_APPEND)); ++ ++ LKTRTrace("ino %lu, mask 0x%x, brperm 0x%x\n", ++ hidden_inode->i_ino, mask, brperm); ++ ++ err = -EACCES; ++ if (unlikely(write_mask && IS_IMMUTABLE(hidden_inode))) ++ goto out; ++ ++ /* skip hidden fs test in the case of write to ro branch */ ++ submask = mask & ~MAY_APPEND; ++ if (unlikely((write_mask && !br_writable(brperm)) ++ || !hidden_inode->i_op ++ || !hidden_inode->i_op->permission)) { ++ //LKTRLabel(generic_permission); ++ err = generic_permission(hidden_inode, submask, NULL); ++ } else { ++ //LKTRLabel(h_inode->permission); ++ err = hidden_inode->i_op->permission(hidden_inode, submask, ++ fake_nd); ++ TraceErr(err); ++ } ++ ++#if 1 ++ if (!err) { ++#ifndef CONFIG_AUFS_DLGT ++ err = security_inode_permission(hidden_inode, mask, fake_nd); ++#else ++ if (!dlgt) ++ err = security_inode_permission(hidden_inode, mask, ++ fake_nd); ++ else { ++ struct security_inode_permission_args args = { ++ .errp = &err, ++ .h_inode = hidden_inode, ++ .mask = mask, ++ .fake_nd = fake_nd ++ }; ++ au_wkq_wait(call_security_inode_permission, &args, ++ /*dlgt*/1); ++ } ++#endif ++ } ++#endif ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static int silly_lock(struct inode *inode, struct nameidata *nd) ++{ ++ int locked = 0; ++ struct super_block *sb = inode->i_sb; ++ ++ LKTRTrace("i%lu, nd %p\n", inode->i_ino, nd); ++ ++#ifdef CONFIG_AUFS_FAKE_DM ++ si_read_lock(sb); ++ ii_read_lock_child(inode); ++#else ++ if (!nd || !nd->dentry) { ++ si_read_lock(sb); ++ ii_read_lock_child(inode); ++ } else if (nd->dentry->d_inode != inode) { ++ locked = 1; ++ /* lock child first, then parent */ ++ si_read_lock(sb); ++ ii_read_lock_child(inode); ++ di_read_lock_parent(nd->dentry, 0); ++ } else { ++ locked = 2; ++ aufs_read_lock(nd->dentry, AUFS_I_RLOCK); ++ } ++#endif ++ return locked; ++} ++ ++static void silly_unlock(int locked, struct inode *inode, struct nameidata *nd) ++{ ++ struct super_block *sb = inode->i_sb; ++ ++ LKTRTrace("locked %d, i%lu, nd %p\n", locked, inode->i_ino, nd); ++ ++#ifdef CONFIG_AUFS_FAKE_DM ++ ii_read_unlock(inode); ++ si_read_unlock(sb); ++#else ++ switch (locked) { ++ case 0: ++ ii_read_unlock(inode); ++ si_read_unlock(sb); ++ break; ++ case 1: ++ di_read_unlock(nd->dentry, 0); ++ ii_read_unlock(inode); ++ si_read_unlock(sb); ++ break; ++ case 2: ++ aufs_read_unlock(nd->dentry, AUFS_I_RLOCK); ++ break; ++ default: ++ BUG(); ++ } ++#endif ++} ++ ++static int aufs_permission(struct inode *inode, int mask, struct nameidata *nd) ++{ ++ int err, locked, dlgt; ++ aufs_bindex_t bindex, bend; ++ struct inode *hidden_inode; ++ struct super_block *sb; ++ struct nameidata fake_nd, *p; ++ const int write_mask = (mask & (MAY_WRITE | MAY_APPEND)); ++ const int nondir = !S_ISDIR(inode->i_mode); ++ ++ LKTRTrace("ino %lu, mask 0x%x, nondir %d, write_mask %d, " ++ "nd %p{%p, %p}\n", ++ inode->i_ino, mask, nondir, write_mask, ++ nd, nd ? nd->dentry : NULL, nd ? nd->mnt : NULL); ++ ++ sb = inode->i_sb; ++ locked = silly_lock(inode, nd); ++ dlgt = need_dlgt(sb); ++ ++ if (nd) ++ fake_nd = *nd; ++ if (/* unlikely */(nondir || write_mask)) { ++ hidden_inode = au_h_iptr(inode); ++ DEBUG_ON(!hidden_inode ++ || ((hidden_inode->i_mode & S_IFMT) ++ != (inode->i_mode & S_IFMT))); ++ err = 0; ++ bindex = ibstart(inode); ++ p = fake_dm(&fake_nd, nd, sb, bindex); ++ /* actual test will be delegated to LSM */ ++ if (IS_ERR(p)) ++ DEBUG_ON(PTR_ERR(p) != -ENOENT); ++ else { ++ err = hidden_permission(hidden_inode, mask, p, ++ sbr_perm(sb, bindex), dlgt); ++ fake_dm_release(p); ++ } ++ if (write_mask && !err) { ++ err = find_rw_br(sb, bindex); ++ if (err >= 0) ++ err = 0; ++ } ++ goto out; ++ } ++ ++ /* non-write to dir */ ++ err = 0; ++ bend = ibend(inode); ++ for (bindex = ibstart(inode); !err && bindex <= bend; bindex++) { ++ hidden_inode = au_h_iptr_i(inode, bindex); ++ if (!hidden_inode) ++ continue; ++ DEBUG_ON(!S_ISDIR(hidden_inode->i_mode)); ++ ++ p = fake_dm(&fake_nd, nd, sb, bindex); ++ /* actual test will be delegated to LSM */ ++ if (IS_ERR(p)) ++ DEBUG_ON(PTR_ERR(p) != -ENOENT); ++ else { ++ err = hidden_permission(hidden_inode, mask, p, ++ sbr_perm(sb, bindex), dlgt); ++ fake_dm_release(p); ++ } ++ } ++ ++ out: ++ silly_unlock(locked, inode, nd); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static struct dentry *aufs_lookup(struct inode *dir, struct dentry *dentry, ++ struct nameidata *nd) ++{ ++ struct dentry *ret, *parent; ++ int err, npositive; ++ struct inode *inode; ++ ++ LKTRTrace("dir %lu, %.*s\n", dir->i_ino, DLNPair(dentry)); ++ DEBUG_ON(IS_ROOT(dentry)); ++ IMustLock(dir); ++ ++ parent = dentry->d_parent; // dget_parent() ++ aufs_read_lock(parent, !AUFS_I_RLOCK); ++ err = au_alloc_dinfo(dentry); ++ //if (LktrCond) err = -1; ++ ret = ERR_PTR(err); ++ if (unlikely(err)) ++ goto out; ++ ++ err = npositive = lkup_dentry(dentry, dbstart(parent), /*type*/0); ++ //err = -1; ++ ret = ERR_PTR(err); ++ if (unlikely(err < 0)) ++ goto out_unlock; ++ inode = NULL; ++ if (npositive) { ++ inode = au_new_inode(dentry); ++ ret = (void*)inode; ++ } ++ if (!IS_ERR(inode)) { ++#if 1 ++ /* d_splice_alias() also supports d_add() */ ++ ret = d_splice_alias(inode, dentry); ++ if (unlikely(IS_ERR(ret) && inode)) ++ ii_write_unlock(inode); ++#else ++ d_add(dentry, inode); ++#endif ++ } ++ ++ out_unlock: ++ di_write_unlock(dentry); ++ out: ++ aufs_read_unlock(parent, !AUFS_I_RLOCK); ++ TraceErrPtr(ret); ++ return ret; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * decide the branch and the parent dir where we will create a new entry. ++ * returns new bindex or an error. ++ * copyup the parent dir if needed. ++ */ ++int wr_dir(struct dentry *dentry, int add_entry, struct dentry *src_dentry, ++ aufs_bindex_t force_btgt, int do_lock_srcdir) ++{ ++ int err; ++ aufs_bindex_t bcpup, bstart, src_bstart; ++ struct dentry *hidden_parent; ++ struct super_block *sb; ++ struct dentry *parent, *src_parent = NULL; ++ struct inode *dir, *src_dir = NULL; ++ ++ LKTRTrace("%.*s, add %d, src %p, force %d, lock_srcdir %d\n", ++ DLNPair(dentry), add_entry, src_dentry, force_btgt, ++ do_lock_srcdir); ++ ++ sb = dentry->d_sb; ++ parent = dentry->d_parent; // dget_parent() ++ bcpup = bstart = dbstart(dentry); ++ if (force_btgt < 0) { ++ if (src_dentry) { ++ src_bstart = dbstart(src_dentry); ++ if (src_bstart < bstart) ++ bcpup = src_bstart; ++ } ++ if (test_ro(sb, bcpup, dentry->d_inode)) { ++ if (!add_entry) ++ di_read_lock_parent(parent, !AUFS_I_RLOCK); ++ bcpup = err = find_rw_parent_br(dentry, bcpup); ++ //bcpup = err = find_rw_br(sb, bcpup); ++ if (!add_entry) ++ di_read_unlock(parent, !AUFS_I_RLOCK); ++ //err = -1; ++ if (unlikely(err < 0)) ++ goto out; ++ } ++ } else { ++ DEBUG_ON(bstart <= force_btgt ++ || test_ro(sb, force_btgt, dentry->d_inode)); ++ bcpup = force_btgt; ++ } ++ LKTRTrace("bstart %d, bcpup %d\n", bstart, bcpup); ++ ++ err = bcpup; ++ if (bcpup == bstart) ++ goto out; /* success */ ++ ++ /* copyup the new parent into the branch we process */ ++ hidden_parent = au_h_dptr(dentry)->d_parent; // dget_parent() ++ if (src_dentry) { ++ src_parent = src_dentry->d_parent; // dget_parent() ++ src_dir = src_parent->d_inode; ++ if (do_lock_srcdir) ++ di_write_lock_parent2(src_parent); ++ } ++ ++ dir = parent->d_inode; ++ if (add_entry) { ++ au_update_dbstart(dentry); ++ IMustLock(dir); ++ DiMustWriteLock(parent); ++ IiMustWriteLock(dir); ++ } else ++ di_write_lock_parent(parent); ++ ++ err = 0; ++ if (!au_h_dptr_i(parent, bcpup)) ++ err = cpup_dirs(dentry, bcpup, src_parent); ++ //err = -1; ++ if (!err && add_entry) { ++ hidden_parent = au_h_dptr_i(parent, bcpup); ++ DEBUG_ON(!hidden_parent || !hidden_parent->d_inode); ++ hi_lock_parent(hidden_parent->d_inode); ++ err = lkup_neg(dentry, bcpup); ++ //err = -1; ++ i_unlock(hidden_parent->d_inode); ++ } ++ ++ if (!add_entry) ++ di_write_unlock(parent); ++ if (do_lock_srcdir) ++ di_write_unlock(src_parent); ++ if (!err) ++ err = bcpup; /* success */ ++ //err = -EPERM; ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int aufs_setattr(struct dentry *dentry, struct iattr *ia) ++{ ++ int err, isdir; ++ aufs_bindex_t bstart, bcpup; ++ struct inode *hidden_inode, *inode, *dir, *h_dir, *gh_dir, *gdir; ++ struct dentry *hidden_dentry, *parent; ++ unsigned int udba; ++ ++ LKTRTrace("%.*s, ia_valid 0x%x\n", DLNPair(dentry), ia->ia_valid); ++ inode = dentry->d_inode; ++ IMustLock(inode); ++ ++ aufs_read_lock(dentry, AUFS_D_WLOCK); ++ bstart = dbstart(dentry); ++ bcpup = err = wr_dir(dentry, /*add*/0, /*src_dentry*/NULL, ++ /*force_btgt*/-1, /*do_lock_srcdir*/0); ++ //err = -1; ++ if (unlikely(err < 0)) ++ goto out; ++ ++ /* crazy udba locks */ ++ udba = au_flag_test(dentry->d_sb, AuFlag_UDBA_INOTIFY); ++ parent = NULL; ++ gdir = gh_dir = dir = h_dir = NULL; ++ if ((udba || bstart != bcpup) && !IS_ROOT(dentry)) { ++ parent = dentry->d_parent; // dget_parent() ++ dir = parent->d_inode; ++ di_read_lock_parent(parent, AUFS_I_RLOCK); ++ h_dir = au_h_iptr_i(dir, bcpup); ++ } ++ if (parent) { ++ if (unlikely(udba && !IS_ROOT(parent))) { ++ gdir = parent->d_parent->d_inode; // dget_parent() ++ ii_read_lock_parent2(gdir); ++ gh_dir = au_h_iptr_i(gdir, bcpup); ++ hgdir_lock(gh_dir, gdir, bcpup); ++ } ++ hdir_lock(h_dir, dir, bcpup); ++ } ++ ++ isdir = S_ISDIR(inode->i_mode); ++ hidden_dentry = au_h_dptr(dentry); ++ hidden_inode = hidden_dentry->d_inode; ++ DEBUG_ON(!hidden_inode); ++ ++#define HiLock(bindex) do {\ ++ if (!isdir) \ ++ hi_lock_child(hidden_inode); \ ++ else \ ++ hdir2_lock(hidden_inode, inode, bindex); \ ++ } while (0) ++#define HiUnlock(bindex) do {\ ++ if (!isdir) \ ++ i_unlock(hidden_inode); \ ++ else \ ++ hdir_unlock(hidden_inode, inode, bindex); \ ++ } while (0) ++ ++ if (bstart != bcpup) { ++ loff_t size = -1; ++ ++ if ((ia->ia_valid & ATTR_SIZE) ++ && ia->ia_size < i_size_read(inode)) { ++ size = ia->ia_size; ++ ia->ia_valid &= ~ATTR_SIZE; ++ } ++ HiLock(bstart); ++ err = sio_cpup_simple(dentry, bcpup, size, ++ au_flags_cpup(CPUP_DTIME, parent)); ++ //err = -1; ++ HiUnlock(bstart); ++ if (unlikely(err || !ia->ia_valid)) ++ goto out_unlock; ++ ++ hidden_dentry = au_h_dptr(dentry); ++ hidden_inode = hidden_dentry->d_inode; ++ DEBUG_ON(!hidden_inode); ++ } ++ ++ HiLock(bcpup); ++ err = vfsub_notify_change(hidden_dentry, ia, need_dlgt(dentry->d_sb)); ++ //err = -1; ++ if (!err) ++ au_cpup_attr_changable(inode); ++ HiUnlock(bcpup); ++#undef HiLock ++#undef HiUnlock ++ ++ out_unlock: ++ if (parent) { ++ hdir_unlock(h_dir, dir, bcpup); ++ di_read_unlock(parent, AUFS_I_RLOCK); ++ } ++ if (unlikely(gdir)) { ++ hdir_unlock(gh_dir, gdir, bcpup); ++ ii_read_unlock(gdir); ++ } ++ out: ++ aufs_read_unlock(dentry, AUFS_D_WLOCK); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int hidden_readlink(struct dentry *dentry, int bindex, ++ char __user * buf, int bufsiz) ++{ ++ struct super_block *sb; ++ struct dentry *hidden_dentry; ++ ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (unlikely(!hidden_dentry->d_inode->i_op ++ || !hidden_dentry->d_inode->i_op->readlink)) ++ return -EINVAL; ++ ++ sb = dentry->d_sb; ++ if (!test_ro(sb, bindex, dentry->d_inode)) { ++ touch_atime(sbr_mnt(sb, bindex), hidden_dentry); ++ dentry->d_inode->i_atime = hidden_dentry->d_inode->i_atime; ++ } ++ return hidden_dentry->d_inode->i_op->readlink ++ (hidden_dentry, buf, bufsiz); ++} ++ ++static int aufs_readlink(struct dentry *dentry, char __user * buf, int bufsiz) ++{ ++ int err; ++ ++ LKTRTrace("%.*s, %d\n", DLNPair(dentry), bufsiz); ++ ++ aufs_read_lock(dentry, AUFS_I_RLOCK); ++ err = hidden_readlink(dentry, dbstart(dentry), buf, bufsiz); ++ //err = -1; ++ aufs_read_unlock(dentry, AUFS_I_RLOCK); ++ TraceErr(err); ++ return err; ++} ++ ++static void *aufs_follow_link(struct dentry *dentry, struct nameidata *nd) ++{ ++ int err; ++ char *buf; ++ mm_segment_t old_fs; ++ ++ LKTRTrace("%.*s, nd %.*s\n", DLNPair(dentry), DLNPair(nd->dentry)); ++ ++ err = -ENOMEM; ++ buf = __getname(); ++ //buf = NULL; ++ if (unlikely(!buf)) ++ goto out; ++ ++ aufs_read_lock(dentry, AUFS_I_RLOCK); ++ old_fs = get_fs(); ++ set_fs(KERNEL_DS); ++ err = hidden_readlink(dentry, dbstart(dentry), (char __user *)buf, ++ PATH_MAX); ++ //err = -1; ++ set_fs(old_fs); ++ aufs_read_unlock(dentry, AUFS_I_RLOCK); ++ ++ if (err >= 0) { ++ buf[err] = 0; ++ /* will be freed by put_link */ ++ nd_set_link(nd, buf); ++ return NULL; /* success */ ++ } ++ __putname(buf); ++ ++ out: ++ path_release(nd); ++ TraceErr(err); ++ return ERR_PTR(err); ++} ++ ++static void aufs_put_link(struct dentry *dentry, struct nameidata *nd, ++ void *cookie) ++{ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ __putname(nd_get_link(nd)); ++} ++ ++/* ---------------------------------------------------------------------- */ ++#if 0 // comment ++struct inode_operations { ++ int (*create) (struct inode *,struct dentry *,int, struct nameidata *); ++ struct dentry * (*lookup) (struct inode *,struct dentry *, struct nameidata *); ++ int (*link) (struct dentry *,struct inode *,struct dentry *); ++ int (*unlink) (struct inode *,struct dentry *); ++ int (*symlink) (struct inode *,struct dentry *,const char *); ++ int (*mkdir) (struct inode *,struct dentry *,int); ++ int (*rmdir) (struct inode *,struct dentry *); ++ int (*mknod) (struct inode *,struct dentry *,int,dev_t); ++ int (*rename) (struct inode *, struct dentry *, ++ struct inode *, struct dentry *); ++ int (*readlink) (struct dentry *, char __user *,int); ++ void * (*follow_link) (struct dentry *, struct nameidata *); ++ void (*put_link) (struct dentry *, struct nameidata *, void *); ++ void (*truncate) (struct inode *); ++ int (*permission) (struct inode *, int, struct nameidata *); ++ int (*setattr) (struct dentry *, struct iattr *); ++ int (*getattr) (struct vfsmount *mnt, struct dentry *, struct kstat *); ++ int (*setxattr) (struct dentry *, const char *,const void *,size_t,int); ++ ssize_t (*getxattr) (struct dentry *, const char *, void *, size_t); ++ ssize_t (*listxattr) (struct dentry *, char *, size_t); ++ int (*removexattr) (struct dentry *, const char *); ++ void (*truncate_range)(struct inode *, loff_t, loff_t); ++}; ++#endif ++ ++struct inode_operations aufs_symlink_iop = { ++ .permission = aufs_permission, ++ .setattr = aufs_setattr, ++ ++ .readlink = aufs_readlink, ++ .follow_link = aufs_follow_link, ++ .put_link = aufs_put_link ++}; ++ ++//i_op_add.c ++int aufs_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev); ++int aufs_symlink(struct inode *dir, struct dentry *dentry, const char *symname); ++int aufs_create(struct inode *dir, struct dentry *dentry, int mode, ++ struct nameidata *nd); ++int aufs_link(struct dentry *src_dentry, struct inode *dir, ++ struct dentry *dentry); ++int aufs_mkdir(struct inode *dir, struct dentry *dentry, int mode); ++ ++//i_op_del.c ++int aufs_unlink(struct inode *dir, struct dentry *dentry); ++int aufs_rmdir(struct inode *dir, struct dentry *dentry); ++ ++// i_op_ren.c ++int aufs_rename(struct inode *src_dir, struct dentry *src_dentry, ++ struct inode *dir, struct dentry *dentry); ++ ++struct inode_operations aufs_dir_iop = { ++ .create = aufs_create, ++ .lookup = aufs_lookup, ++ .link = aufs_link, ++ .unlink = aufs_unlink, ++ .symlink = aufs_symlink, ++ .mkdir = aufs_mkdir, ++ .rmdir = aufs_rmdir, ++ .mknod = aufs_mknod, ++ .rename = aufs_rename, ++ ++ .permission = aufs_permission, ++ .setattr = aufs_setattr, ++ ++#if 0 // xattr ++ .setxattr = aufs_setxattr, ++ .getxattr = aufs_getxattr, ++ .listxattr = aufs_listxattr, ++ .removexattr = aufs_removexattr ++#endif ++}; ++ ++struct inode_operations aufs_iop = { ++ .permission = aufs_permission, ++ .setattr = aufs_setattr, ++ ++#if 0 // xattr ++ .setxattr = aufs_setxattr, ++ .getxattr = aufs_getxattr, ++ .listxattr = aufs_listxattr, ++ .removexattr = aufs_removexattr ++#endif ++}; +diff --git a/fs/aufs/i_op_add.c b/fs/aufs/i_op_add.c +new file mode 100755 +index 0000000..977d773 +--- /dev/null ++++ b/fs/aufs/i_op_add.c +@@ -0,0 +1,621 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: i_op_add.c,v 1.37 2007/05/07 03:46:08 sfjro Exp $ */ ++ ++//#include <linux/fs.h> ++//#include <linux/namei.h> ++#include "aufs.h" ++ ++/* ++ * final procedure of adding a new entry, except link(2). ++ * remove whiteout, instantiate, copyup the parent dir's times and size ++ * and update version. ++ * if it failed, re-create the removed whiteout. ++ */ ++static int epilog(struct dentry *wh_dentry, struct dentry *dentry) ++{ ++ int err, rerr; ++ aufs_bindex_t bwh; ++ struct inode *inode, *dir; ++ struct dentry *wh; ++ struct lkup_args lkup; ++ ++ LKTRTrace("wh %p, %.*s\n", wh_dentry, DLNPair(dentry)); ++ ++ lkup.dlgt = need_dlgt(dentry->d_sb); ++ bwh = -1; ++ if (wh_dentry) { ++ bwh = dbwh(dentry); ++ err = au_unlink_wh_dentry(wh_dentry->d_parent->d_inode, ++ wh_dentry, dentry, lkup.dlgt); ++ //err = -1; ++ if (unlikely(err)) ++ goto out; ++ } ++ ++ inode = au_new_inode(dentry); ++ //inode = ERR_PTR(-1); ++ if (!IS_ERR(inode)) { ++ d_instantiate(dentry, inode); ++ dir = dentry->d_parent->d_inode; ++ /* or always cpup dir mtime? */ ++ if (ibstart(dir) == dbstart(dentry)) ++ au_cpup_attr_timesizes(dir); ++ dir->i_version++; ++ return 0; /* success */ ++ } ++ ++ err = PTR_ERR(inode); ++ if (!wh_dentry) ++ goto out; ++ ++ /* revert */ ++ lkup.nfsmnt = au_nfsmnt(dentry->d_sb, bwh); ++ wh = simple_create_wh(dentry, bwh, wh_dentry->d_parent, &lkup); ++ //wh = ERR_PTR(-1); ++ rerr = PTR_ERR(wh); ++ if (!IS_ERR(wh)) { ++ dput(wh); ++ goto out; ++ } ++ IOErr("%.*s reverting whiteout failed(%d, %d)\n", ++ DLNPair(dentry), err, rerr); ++ err = -EIO; ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * initial procedure of adding a new entry. ++ * prepare writable branch and the parent dir, lock it, ++ * lookup whiteout for the new entry. ++ */ ++static struct dentry * ++lock_hdir_lkup_wh(struct dentry *dentry, struct dtime *dt, ++ struct dentry *src_dentry, int do_lock_srcdir) ++{ ++ struct dentry *wh_dentry, *parent, *hidden_parent; ++ int err; ++ aufs_bindex_t bstart, bcpup; ++ struct inode *dir, *h_dir; ++ struct lkup_args lkup; ++ ++ LKTRTrace("%.*s, src %p\n", DLNPair(dentry), src_dentry); ++ ++ parent = dentry->d_parent; ++ bstart = dbstart(dentry); ++ bcpup = err = wr_dir(dentry, 1, src_dentry, -1, do_lock_srcdir); ++ //err = -1; ++ wh_dentry = ERR_PTR(err); ++ if (unlikely(err < 0)) ++ goto out; ++ ++ dir = parent->d_inode; ++ hidden_parent = au_h_dptr_i(parent, bcpup); ++ h_dir = hidden_parent->d_inode; ++ hdir_lock(h_dir, dir, bcpup); ++ if (dt) ++ dtime_store(dt, parent, hidden_parent); ++ if (/* bcpup != bstart || */ bcpup != dbwh(dentry)) ++ return NULL; /* success */ ++ ++ lkup.nfsmnt = au_nfsmnt(parent->d_sb, bcpup); ++ lkup.dlgt = need_dlgt(parent->d_sb); ++ wh_dentry = lkup_wh(hidden_parent, &dentry->d_name, &lkup); ++ //wh_dentry = ERR_PTR(-1); ++ if (IS_ERR(wh_dentry)) ++ hdir_unlock(h_dir, dir, bcpup); ++ ++ out: ++ TraceErrPtr(wh_dentry); ++ return wh_dentry; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++enum {Mknod, Symlink, Creat}; ++struct simple_arg { ++ int type; ++ union { ++ struct { ++ int mode; ++ struct nameidata *nd; ++ } c; ++ struct { ++ const char *symname; ++ } s; ++ struct { ++ int mode; ++ dev_t dev; ++ } m; ++ } u; ++}; ++ ++static int add_simple(struct inode *dir, struct dentry *dentry, ++ struct simple_arg *arg) ++{ ++ int err, dlgt; ++ struct dentry *hidden_dentry, *hidden_parent, *wh_dentry, *parent; ++ struct inode *hidden_dir; ++ struct dtime dt; ++ ++ LKTRTrace("type %d, %.*s\n", arg->type, DLNPair(dentry)); ++ IMustLock(dir); ++ ++ aufs_read_lock(dentry, AUFS_D_WLOCK); ++ parent = dentry->d_parent; ++ di_write_lock_parent(parent); ++ wh_dentry = lock_hdir_lkup_wh(dentry, &dt, /*src_dentry*/NULL, ++ /*do_lock_srcdir*/0); ++ //wh_dentry = ERR_PTR(-1); ++ err = PTR_ERR(wh_dentry); ++ if (IS_ERR(wh_dentry)) ++ goto out; ++ ++ hidden_dentry = au_h_dptr(dentry); ++ hidden_parent = hidden_dentry->d_parent; ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ dlgt = need_dlgt(dir->i_sb); ++ ++#if 1 // partial testing ++ switch (arg->type) { ++ case Creat: ++#if 0 ++ if (arg->u.c.nd) { ++ struct nameidata fake_nd; ++ fake_nd = *arg->u.c.nd; ++ fake_nd.dentry = dget(hidden_parent); ++ fake_nd.mnt = sbr_mnt(dentry->d_sb, dbstart(dentry)); ++ mntget(fake_nd.mnt); ++ err = vfsub_create(hidden_dir, hidden_dentry, ++ arg->u.c.mode, &fake_nd, dlgt); ++ path_release(&fake_nd); ++ } else ++#endif ++ err = vfsub_create(hidden_dir, hidden_dentry, ++ arg->u.c.mode, NULL, dlgt); ++ break; ++ case Symlink: ++ err = vfsub_symlink(hidden_dir, hidden_dentry, ++ arg->u.s.symname, S_IALLUGO, dlgt); ++ break; ++ case Mknod: ++ err = vfsub_mknod(hidden_dir, hidden_dentry, ++ arg->u.m.mode, arg->u.m.dev, dlgt); ++ break; ++ default: ++ BUG(); ++ } ++#else ++ err = -1; ++#endif ++ if (!err) ++ err = epilog(wh_dentry, dentry); ++ //err = -1; ++ ++ /* revert */ ++ if (unlikely(err && hidden_dentry->d_inode)) { ++ int rerr; ++ rerr = vfsub_unlink(hidden_dir, hidden_dentry, dlgt); ++ //rerr = -1; ++ if (rerr) { ++ IOErr("%.*s revert failure(%d, %d)\n", ++ DLNPair(dentry), err, rerr); ++ err = -EIO; ++ } ++ dtime_revert(&dt, !CPUP_LOCKED_GHDIR); ++ d_drop(dentry); ++ } ++ ++ hdir_unlock(hidden_dir, dir, dbstart(dentry)); ++ dput(wh_dentry); ++ ++ out: ++ if (unlikely(err)) { ++ au_update_dbstart(dentry); ++ d_drop(dentry); ++ } ++ di_write_unlock(parent); ++ aufs_read_unlock(dentry, AUFS_D_WLOCK); ++ TraceErr(err); ++ return err; ++} ++ ++int aufs_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev) ++{ ++ struct simple_arg arg = { ++ .type = Mknod, ++ .u.m = {.mode = mode, .dev = dev} ++ }; ++ return add_simple(dir, dentry, &arg); ++} ++ ++int aufs_symlink(struct inode *dir, struct dentry *dentry, const char *symname) ++{ ++ struct simple_arg arg = { ++ .type = Symlink, ++ .u.s.symname = symname ++ }; ++ return add_simple(dir, dentry, &arg); ++} ++ ++int aufs_create(struct inode *dir, struct dentry *dentry, int mode, ++ struct nameidata *nd) ++{ ++ struct simple_arg arg = { ++ .type = Creat, ++ .u.c = {.mode = mode, .nd = nd} ++ }; ++ return add_simple(dir, dentry, &arg); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct link_arg { ++ aufs_bindex_t bdst, bsrc; ++ int issamedir, dlgt; ++ struct dentry *src_parent, *parent, *hidden_dentry; ++ struct inode *hidden_dir, *inode; ++}; ++ ++static int cpup_before_link(struct dentry *src_dentry, struct inode *dir, ++ struct link_arg *a) ++{ ++ int err; ++ unsigned int flags; ++ struct inode *hi, *hdir = NULL, *src_dir; ++ ++ TraceEnter(); ++ ++ err = 0; ++ flags = au_flags_cpup(CPUP_DTIME, a->parent); ++ src_dir = a->src_parent->d_inode; ++ if (!a->issamedir) { ++ // todo: dead lock? ++ di_read_lock_parent2(a->src_parent, AUFS_I_RLOCK); ++ // this temporary unlock/lock is safe ++ hdir_unlock(a->hidden_dir, dir, a->bdst); ++ err = test_and_cpup_dirs(src_dentry, a->bdst, a->parent); ++ //err = -1; ++ if (!err) { ++ hdir = au_h_iptr_i(src_dir, a->bdst); ++ hdir_lock(hdir, src_dir, a->bdst); ++ flags = au_flags_cpup(CPUP_DTIME, a->src_parent); ++ } ++ } ++ ++ if (!err) { ++ hi = au_h_dptr(src_dentry)->d_inode; ++ hi_lock_child(hi); ++ err = sio_cpup_simple(src_dentry, a->bdst, -1, flags); ++ //err = -1; ++ i_unlock(hi); ++ } ++ ++ if (!a->issamedir) { ++ if (hdir) ++ hdir_unlock(hdir, src_dir, a->bdst); ++ hdir_lock(a->hidden_dir, dir, a->bdst); ++ di_read_unlock(a->src_parent, AUFS_I_RLOCK); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int cpup_or_link(struct dentry *src_dentry, struct link_arg *a) ++{ ++ int err; ++ struct inode *inode, *h_inode, *h_dst_inode; ++ struct dentry *h_dentry; ++ aufs_bindex_t bstart; ++ struct super_block *sb; ++ ++ TraceEnter(); ++ ++ sb = src_dentry->d_sb; ++ inode = src_dentry->d_inode; ++ h_dentry = au_h_dptr(src_dentry); ++ h_inode = h_dentry->d_inode; ++ bstart = ibstart(inode); ++ h_dst_inode = NULL; ++ if (bstart <= a->bdst) ++ h_dst_inode = au_h_iptr_i(inode, a->bdst); ++ ++ if (!h_dst_inode) { ++ /* copyup src_dentry as the name of dentry. */ ++ set_dbstart(src_dentry, a->bdst); ++ set_h_dptr(src_dentry, a->bdst, dget(a->hidden_dentry)); ++ hi_lock_child(h_inode); ++ err = sio_cpup_single(src_dentry, a->bdst, a->bsrc, -1, ++ au_flags_cpup(!CPUP_DTIME, a->parent)); ++ //err = -1; ++ i_unlock(h_inode); ++ set_h_dptr(src_dentry, a->bdst, NULL); ++ set_dbstart(src_dentry, a->bsrc); ++ } else { ++ /* the inode of src_dentry already exists on a.bdst branch */ ++ h_dentry = d_find_alias(h_dst_inode); ++ if (h_dentry) { ++ err = vfsub_link(h_dentry, a->hidden_dir, ++ a->hidden_dentry, a->dlgt); ++ dput(h_dentry); ++ } else { ++ IOErr("no dentry found for i%lu on b%d\n", ++ h_dst_inode->i_ino, a->bdst); ++ err = -EIO; ++ } ++ } ++ ++ if (!err) ++ append_plink(sb, a->inode, a->hidden_dentry, a->bdst); ++ ++ TraceErr(err); ++ return err; ++} ++ ++int aufs_link(struct dentry *src_dentry, struct inode *dir, ++ struct dentry *dentry) ++{ ++ int err, rerr; ++ struct dentry *hidden_parent, *wh_dentry, *hidden_src_dentry; ++ struct dtime dt; ++ struct link_arg a; ++ struct super_block *sb; ++ ++ LKTRTrace("src %.*s, i%lu, dst %.*s\n", ++ DLNPair(src_dentry), dir->i_ino, DLNPair(dentry)); ++ IMustLock(dir); ++ IMustLock(src_dentry->d_inode); ++ ++ aufs_read_and_write_lock2(dentry, src_dentry, /*isdir*/0); ++ a.src_parent = src_dentry->d_parent; ++ a.parent = dentry->d_parent; ++ a.issamedir = (a.src_parent == a.parent); ++ di_write_lock_parent(a.parent); ++ wh_dentry = lock_hdir_lkup_wh(dentry, &dt, src_dentry, !a.issamedir); ++ //wh_dentry = ERR_PTR(-1); ++ err = PTR_ERR(wh_dentry); ++ if (IS_ERR(wh_dentry)) ++ goto out; ++ ++ a.inode = src_dentry->d_inode; ++ a.hidden_dentry = au_h_dptr(dentry); ++ hidden_parent = a.hidden_dentry->d_parent; ++ a.hidden_dir = hidden_parent->d_inode; ++ IMustLock(a.hidden_dir); ++ ++ err = 0; ++ sb = dentry->d_sb; ++ a.dlgt = need_dlgt(sb); ++ ++ //todo: minor optimize, their sb may be same while their bindex differs. ++ a.bsrc = dbstart(src_dentry); ++ a.bdst = dbstart(dentry); ++ hidden_src_dentry = au_h_dptr(src_dentry); ++ if (unlikely(!au_flag_test(sb, AuFlag_PLINK))) { ++ /* ++ * copyup src_dentry to the branch we process, ++ * and then link(2) to it. ++ * gave up 'pseudo link by cpup' approach, ++ * since nlink may be one and some applications will not work. ++ */ ++ if (a.bdst < a.bsrc ++ /* && hidden_src_dentry->d_sb != a.hidden_dentry->d_sb */) ++ err = cpup_before_link(src_dentry, dir, &a); ++ if (!err) { ++ hidden_src_dentry = au_h_dptr(src_dentry); ++ err = vfsub_link(hidden_src_dentry, a.hidden_dir, ++ a.hidden_dentry, a.dlgt); ++ //err = -1; ++ } ++ } else { ++ if (a.bdst < a.bsrc ++ /* && hidden_src_dentry->d_sb != a.hidden_dentry->d_sb */) ++ err = cpup_or_link(src_dentry, &a); ++ else { ++ hidden_src_dentry = au_h_dptr(src_dentry); ++ err = vfsub_link(hidden_src_dentry, a.hidden_dir, ++ a.hidden_dentry, a.dlgt); ++ //err = -1; ++ } ++ } ++ if (unlikely(err)) ++ goto out_unlock; ++ if (wh_dentry) { ++ err = au_unlink_wh_dentry(a.hidden_dir, wh_dentry, dentry, ++ a.dlgt); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_revert; ++ } ++ ++ dir->i_version++; ++ if (ibstart(dir) == dbstart(dentry)) ++ au_cpup_attr_timesizes(dir); ++ if (!d_unhashed(a.hidden_dentry) ++ /* || hidden_old_inode->i_nlink <= nlink */ ++ /* || SB_NFS(hidden_src_dentry->d_sb) */) { ++ dentry->d_inode = igrab(a.inode); ++ d_instantiate(dentry, a.inode); ++ a.inode->i_nlink++; ++ a.inode->i_ctime = dir->i_ctime; ++ } else ++ /* nfs case (< 2.6.15) */ ++ d_drop(dentry); ++#if 0 ++ au_debug_on(); ++ DbgInode(a.inode); ++ au_debug_off(); ++ { ++ aufs_bindex_t i; ++ for (i = ibstart(a.inode); i <= ibend(a.inode); i++) { ++ struct xino xino; ++ struct inode *hi; ++ hi = au_h_iptr_i(a.inode, i); ++ if (hi) { ++ xino_read(sb, i, hi->i_ino, &xino); ++ Dbg("hi%lu, i%lu\n", hi->i_ino, xino.ino); ++ } ++ } ++ } ++#endif ++ goto out_unlock; /* success */ ++ ++ out_revert: ++#if 0 // remove ++ if (d_unhashed(a.hidden_dentry)) { ++ /* hardlink on nfs (< 2.6.15) */ ++ struct dentry *d; ++ const struct qstr *name = &a.hidden_dentry->d_name; ++ DEBUG_ON(a.hidden_dentry->d_parent->d_inode != a.hidden_dir); ++ // do not superio. ++ d = lkup_one(name->name, a.hidden_dentry->d_parent, name->len, ++ au_nfsmnt(sb, a.bdst)??, need_dlgt(sb)); ++ rerr = PTR_ERR(d); ++ if (IS_ERR(d)) ++ goto out_rerr; ++ dput(a.hidden_dentry); ++ a.hidden_dentry = d; ++ DEBUG_ON(!d->d_inode); ++ } ++#endif ++ rerr = vfsub_unlink(a.hidden_dir, a.hidden_dentry, a.dlgt); ++ //rerr = -1; ++ if (!rerr) ++ goto out_dt; ++// out_rerr: ++ IOErr("%.*s reverting failed(%d, %d)\n", DLNPair(dentry), err, rerr); ++ err = -EIO; ++ out_dt: ++ d_drop(dentry); ++ dtime_revert(&dt, !CPUP_LOCKED_GHDIR); ++ out_unlock: ++ hdir_unlock(a.hidden_dir, dir, a.bdst); ++ dput(wh_dentry); ++ out: ++ if (unlikely(err)) { ++ au_update_dbstart(dentry); ++ d_drop(dentry); ++ } ++ di_write_unlock(a.parent); ++ aufs_read_and_write_unlock2(dentry, src_dentry); ++ TraceErr(err); ++ return err; ++} ++ ++int aufs_mkdir(struct inode *dir, struct dentry *dentry, int mode) ++{ ++ int err, rerr, diropq, dlgt; ++ struct dentry *hidden_dentry, *hidden_parent, *wh_dentry, *parent, ++ *opq_dentry; ++ struct inode *hidden_dir, *hidden_inode; ++ struct dtime dt; ++ aufs_bindex_t bindex; ++ struct super_block *sb; ++ ++ LKTRTrace("i%lu, %.*s, mode 0%o\n", dir->i_ino, DLNPair(dentry), mode); ++ IMustLock(dir); ++ ++ aufs_read_lock(dentry, AUFS_D_WLOCK); ++ parent = dentry->d_parent; ++ di_write_lock_parent(parent); ++ wh_dentry = lock_hdir_lkup_wh(dentry, &dt, /*src_dentry*/NULL, ++ /*do_lock_srcdir*/0); ++ //wh_dentry = ERR_PTR(-1); ++ err = PTR_ERR(wh_dentry); ++ if (IS_ERR(wh_dentry)) ++ goto out; ++ ++ sb = dentry->d_sb; ++ bindex = dbstart(dentry); ++ hidden_dentry = au_h_dptr(dentry); ++ hidden_parent = hidden_dentry->d_parent; ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ dlgt = need_dlgt(sb); ++ ++ err = vfsub_mkdir(hidden_dir, hidden_dentry, mode, dlgt); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_unlock; ++ hidden_inode = hidden_dentry->d_inode; ++ ++ /* make the dir opaque */ ++ diropq = 0; ++ if (unlikely(wh_dentry || au_flag_test(sb, AuFlag_ALWAYS_DIROPQ))) { ++ hi_lock_child(hidden_inode); ++ opq_dentry = create_diropq(dentry, bindex, dlgt); ++ //opq_dentry = ERR_PTR(-1); ++ i_unlock(hidden_inode); ++ err = PTR_ERR(opq_dentry); ++ if (IS_ERR(opq_dentry)) ++ goto out_dir; ++ dput(opq_dentry); ++ diropq = 1; ++ } ++ ++ err = epilog(wh_dentry, dentry); ++ //err = -1; ++ if (!err) { ++ dir->i_nlink++; ++ goto out_unlock; /* success */ ++ } ++ ++ /* revert */ ++ if (unlikely(diropq)) { ++ LKTRLabel(revert opq); ++ hi_lock_child(hidden_inode); ++ rerr = remove_diropq(dentry, bindex, dlgt); ++ //rerr = -1; ++ i_unlock(hidden_inode); ++ if (rerr) { ++ IOErr("%.*s reverting diropq failed(%d, %d)\n", ++ DLNPair(dentry), err, rerr); ++ err = -EIO; ++ } ++ } ++ ++ out_dir: ++ LKTRLabel(revert dir); ++ rerr = vfsub_rmdir(hidden_dir, hidden_dentry, dlgt); ++ //rerr = -1; ++ if (rerr) { ++ IOErr("%.*s reverting dir failed(%d, %d)\n", ++ DLNPair(dentry), err, rerr); ++ err = -EIO; ++ } ++ d_drop(dentry); ++ dtime_revert(&dt, /*fake flag*/CPUP_LOCKED_GHDIR); ++ out_unlock: ++ hdir_unlock(hidden_dir, dir, bindex); ++ dput(wh_dentry); ++ out: ++ if (unlikely(err)) { ++ au_update_dbstart(dentry); ++ d_drop(dentry); ++ } ++ di_write_unlock(parent); ++ aufs_read_unlock(dentry, AUFS_D_WLOCK); ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/i_op_del.c b/fs/aufs/i_op_del.c +new file mode 100755 +index 0000000..f29b204 +--- /dev/null ++++ b/fs/aufs/i_op_del.c +@@ -0,0 +1,414 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: i_op_del.c,v 1.35 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++/* returns, ++ * 0: wh is unnecessary ++ * plus: wh is necessary ++ * minus: error ++ */ ++int wr_dir_need_wh(struct dentry *dentry, int isdir, aufs_bindex_t *bcpup, ++ struct dentry *locked) ++{ ++ int need_wh, err; ++ aufs_bindex_t bstart; ++ struct dentry *hidden_dentry; ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s, isdir %d, *bcpup %d, locked %p\n", ++ DLNPair(dentry), isdir, *bcpup, locked); ++ sb = dentry->d_sb; ++ ++ bstart = dbstart(dentry); ++ LKTRTrace("bcpup %d, bstart %d\n", *bcpup, bstart); ++ hidden_dentry = au_h_dptr(dentry); ++ if (*bcpup < 0) { ++ *bcpup = bstart; ++ if (test_ro(sb, bstart, dentry->d_inode)) { ++ *bcpup = err = find_rw_parent_br(dentry, bstart); ++ //*bcpup = err = find_rw_br(sb, bstart); ++ //err = -1; ++ if (unlikely(err < 0)) ++ goto out; ++ } ++ } else { ++ /* braces are added to stop a warning */ ++ DEBUG_ON(bstart < *bcpup ++ || test_ro(sb, *bcpup, dentry->d_inode)); ++ } ++ LKTRTrace("bcpup %d, bstart %d\n", *bcpup, bstart); ++ ++ if (*bcpup != bstart) { ++ err = cpup_dirs(dentry, *bcpup, locked); ++ //err = -1; ++ if (unlikely(err)) ++ goto out; ++ need_wh = 1; ++ } else { ++ //struct nameidata nd; ++ aufs_bindex_t old_bend, new_bend, bdiropq = -1; ++ old_bend = dbend(dentry); ++ if (isdir) { ++ bdiropq = dbdiropq(dentry); ++ set_dbdiropq(dentry, -1); ++ } ++ err = need_wh = lkup_dentry(dentry, bstart + 1, /*type*/0); ++ //err = -1; ++ if (isdir) ++ set_dbdiropq(dentry, bdiropq); ++ if (unlikely(err < 0)) ++ goto out; ++ new_bend = dbend(dentry); ++ if (!need_wh && old_bend != new_bend) { ++ set_h_dptr(dentry, new_bend, NULL); ++ set_dbend(dentry, old_bend); ++#if 0 ++ } else if (!au_h_dptr_i(dentry, new_bend)->d_inode) { ++ LKTRTrace("negative\n"); ++ set_h_dptr(dentry, new_bend, NULL); ++ set_dbend(dentry, old_bend); ++ need_wh = 0; ++#endif ++ } ++ } ++ LKTRTrace("need_wh %d\n", need_wh); ++ err = need_wh; ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static struct dentry * ++lock_hdir_create_wh(struct dentry *dentry, int isdir, aufs_bindex_t *bcpup, ++ struct dtime *dt) ++{ ++ struct dentry *wh_dentry; ++ int err, need_wh; ++ struct dentry *hidden_parent, *parent; ++ struct inode *dir, *h_dir; ++ struct lkup_args lkup; ++ ++ LKTRTrace("%.*s, isdir %d\n", DLNPair(dentry), isdir); ++ ++ err = need_wh = wr_dir_need_wh(dentry, isdir, bcpup, NULL); ++ //err = -1; ++ wh_dentry = ERR_PTR(err); ++ if (unlikely(err < 0)) ++ goto out; ++ ++ parent = dentry->d_parent; ++ dir = parent->d_inode; ++ hidden_parent = au_h_dptr_i(parent, *bcpup); ++ h_dir = hidden_parent->d_inode; ++ hdir_lock(h_dir, dir, *bcpup); ++ dtime_store(dt, parent, hidden_parent); ++ if (!need_wh) ++ return NULL; /* success, no need to create whiteout */ ++ ++ lkup.nfsmnt = au_nfsmnt(dentry->d_sb, *bcpup); ++ lkup.dlgt = need_dlgt(dentry->d_sb); ++ wh_dentry = simple_create_wh(dentry, *bcpup, hidden_parent, &lkup); ++ //wh_dentry = ERR_PTR(-1); ++ if (!IS_ERR(wh_dentry)) ++ goto out; /* success */ ++ /* returns with the parent is locked and wh_dentry is DGETed */ ++ ++ hdir_unlock(h_dir, dir, *bcpup); ++ ++ out: ++ TraceErrPtr(wh_dentry); ++ return wh_dentry; ++} ++ ++static int renwh_and_rmdir(struct dentry *dentry, aufs_bindex_t bindex, ++ struct aufs_nhash *whlist, struct inode *dir) ++{ ++ int rmdir_later, err; ++ struct dentry *hidden_dentry; ++ ++ LKTRTrace("%.*s, b%d\n", DLNPair(dentry), bindex); ++ ++ err = rename_whtmp(dentry, bindex); ++ //err = -1; ++#if 0 ++ //todo: bug ++ if (unlikely(err)) { ++ au_direval_inc(dentry->d_parent); ++ return err; ++ } ++#endif ++ ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (!au_is_nfs(hidden_dentry->d_sb)) { ++ const int dirwh = stosi(dentry->d_sb)->si_dirwh; ++ rmdir_later = (dirwh <= 1); ++ if (!rmdir_later) ++ rmdir_later = is_longer_wh(whlist, bindex, dirwh); ++ if (rmdir_later) ++ return rmdir_later; ++ } ++ ++ err = rmdir_whtmp(hidden_dentry, whlist, bindex, dir, dentry->d_inode); ++ //err = -1; ++ if (unlikely(err)) { ++ IOErr("rmdir %.*s, b%d failed, %d. ignored\n", ++ DLNPair(hidden_dentry), bindex, err); ++ err = 0; ++ } ++ TraceErr(err); ++ return err; ++} ++ ++static void epilog(struct inode *dir, struct dentry *dentry, ++ aufs_bindex_t bindex) ++{ ++ d_drop(dentry); ++ dentry->d_inode->i_ctime = dir->i_ctime; ++ if (atomic_read(&dentry->d_count) == 1) { ++ set_h_dptr(dentry, dbstart(dentry), NULL); ++ au_update_dbstart(dentry); ++ } ++ if (ibstart(dir) == bindex) ++ au_cpup_attr_timesizes(dir); ++ dir->i_version++; ++} ++ ++static int do_revert(int err, struct dentry *wh_dentry, struct dentry *dentry, ++ aufs_bindex_t bwh, struct dtime *dt, int dlgt) ++{ ++ int rerr; ++ ++ rerr = au_unlink_wh_dentry(wh_dentry->d_parent->d_inode, wh_dentry, ++ dentry, dlgt); ++ //rerr = -1; ++ if (!rerr) { ++ set_dbwh(dentry, bwh); ++ dtime_revert(dt, !CPUP_LOCKED_GHDIR); ++ return 0; ++ } ++ ++ IOErr("%.*s reverting whiteout failed(%d, %d)\n", ++ DLNPair(dentry), err, rerr); ++ return -EIO; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++int aufs_unlink(struct inode *dir, struct dentry *dentry) ++{ ++ int err, dlgt; ++ struct inode *inode, *hidden_dir; ++ struct dentry *parent, *wh_dentry, *hidden_dentry, *hidden_parent; ++ struct dtime dt; ++ aufs_bindex_t bwh, bindex, bstart; ++ struct super_block *sb; ++ ++ LKTRTrace("i%lu, %.*s\n", dir->i_ino, DLNPair(dentry)); ++ IMustLock(dir); ++ inode = dentry->d_inode; ++ if (unlikely(!inode)) ++ return -ENOENT; // possible? ++ IMustLock(inode); ++ ++ aufs_read_lock(dentry, AUFS_D_WLOCK); ++ parent = dentry->d_parent; ++ di_write_lock_parent(parent); ++ ++ bstart = dbstart(dentry); ++ bwh = dbwh(dentry); ++ bindex = -1; ++ wh_dentry = lock_hdir_create_wh(dentry, /*isdir*/0, &bindex, &dt); ++ //wh_dentry = ERR_PTR(-1); ++ err = PTR_ERR(wh_dentry); ++ if (IS_ERR(wh_dentry)) ++ goto out; ++ ++ sb = dir->i_sb; ++ dlgt = need_dlgt(sb); ++ hidden_dentry = au_h_dptr(dentry); ++ dget(hidden_dentry); ++ hidden_parent = hidden_dentry->d_parent; ++ hidden_dir = hidden_parent->d_inode; ++ ++ if (bindex == bstart) { ++ err = vfsub_unlink(hidden_dir, hidden_dentry, dlgt); ++ //err = -1; ++ } else { ++ DEBUG_ON(!wh_dentry); ++ hidden_parent = wh_dentry->d_parent; ++ DEBUG_ON(hidden_parent != au_h_dptr_i(parent, bindex)); ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ err = 0; ++ } ++ ++ if (!err) { ++ inode->i_nlink--; ++ epilog(dir, dentry, bindex); ++#if 0 ++ xino_write0(sb, bstart, hidden_dentry->d_inode->i_ino); ++ /* ignore this error */ ++#endif ++ goto out_unlock; /* success */ ++ } ++ ++ /* revert */ ++ if (wh_dentry) { ++ int rerr; ++ rerr = do_revert(err, wh_dentry, dentry, bwh, &dt, dlgt); ++ if (rerr) ++ err = rerr; ++ } ++ ++ out_unlock: ++ hdir_unlock(hidden_dir, dir, bindex); ++ dput(wh_dentry); ++ dput(hidden_dentry); ++ out: ++ di_write_unlock(parent); ++ aufs_read_unlock(dentry, AUFS_D_WLOCK); ++ TraceErr(err); ++ return err; ++} ++ ++int aufs_rmdir(struct inode *dir, struct dentry *dentry) ++{ ++ int err, rmdir_later; ++ struct inode *inode, *hidden_dir; ++ struct dentry *parent, *wh_dentry, *hidden_dentry, *hidden_parent; ++ struct dtime dt; ++ aufs_bindex_t bwh, bindex, bstart; ++ struct rmdir_whtmp_arg *arg; ++ struct aufs_nhash *whlist; ++ struct super_block *sb; ++ ++ LKTRTrace("i%lu, %.*s\n", dir->i_ino, DLNPair(dentry)); ++ IMustLock(dir); ++ inode = dentry->d_inode; ++ if (unlikely(!inode)) ++ return -ENOENT; // possible? ++ IMustLock(inode); ++ ++ whlist = nhash_new(GFP_KERNEL); ++ err = PTR_ERR(whlist); ++ if (IS_ERR(whlist)) ++ goto out; ++ ++ err = -ENOMEM; ++ arg = kmalloc(sizeof(*arg), GFP_KERNEL); ++ //arg = NULL; ++ if (unlikely(!arg)) ++ goto out_whlist; ++ ++ aufs_read_lock(dentry, AUFS_D_WLOCK); ++ parent = dentry->d_parent; ++ di_write_lock_parent(parent); ++ err = test_empty(dentry, whlist); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_arg; ++ ++ bstart = dbstart(dentry); ++ bwh = dbwh(dentry); ++ bindex = -1; ++ wh_dentry = lock_hdir_create_wh(dentry, /*isdir*/ 1, &bindex, &dt); ++ //wh_dentry = ERR_PTR(-1); ++ err = PTR_ERR(wh_dentry); ++ if (IS_ERR(wh_dentry)) ++ goto out_arg; ++ ++ hidden_dentry = au_h_dptr(dentry); ++ dget(hidden_dentry); ++ hidden_parent = hidden_dentry->d_parent; ++ hidden_dir = hidden_parent->d_inode; ++ ++ rmdir_later = 0; ++ if (bindex == bstart) { ++ IMustLock(hidden_dir); ++ err = renwh_and_rmdir(dentry, bstart, whlist, dir); ++ //err = -1; ++ if (err > 0) { ++ rmdir_later = err; ++ err = 0; ++ } ++ } else { ++ DEBUG_ON(!wh_dentry); ++ hidden_parent = wh_dentry->d_parent; ++ DEBUG_ON(hidden_parent != au_h_dptr_i(parent, bindex)); ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ err = 0; ++ } ++ ++ sb = dentry->d_sb; ++ if (!err) { ++ //aufs_bindex_t bi, bend; ++ ++ au_reset_hinotify(inode, /*flags*/0); ++ inode->i_nlink = 0; ++ set_dbdiropq(dentry, -1); ++ epilog(dir, dentry, bindex); ++ ++ if (rmdir_later) { ++ kick_rmdir_whtmp(hidden_dentry, whlist, bstart, dir, ++ inode, arg); ++ arg = NULL; ++ } ++ ++#if 0 ++ bend = dbend(dentry); ++ for (bi = bstart; bi <= bend; bi++) { ++ struct dentry *hd; ++ hd = au_h_dptr_i(dentry, bi); ++ if (hd && hd->d_inode) ++ xino_write0(sb, bi, hd->d_inode->i_ino); ++ /* ignore this error */ ++ } ++#endif ++ ++ goto out_unlock; /* success */ ++ } ++ ++ /* revert */ ++ LKTRLabel(revert); ++ if (wh_dentry) { ++ int rerr; ++ rerr = do_revert(err, wh_dentry, dentry, bwh, &dt, ++ need_dlgt(sb)); ++ if (rerr) ++ err = rerr; ++ } ++ ++ out_unlock: ++ hdir_unlock(hidden_dir, dir, bindex); ++ dput(wh_dentry); ++ dput(hidden_dentry); ++ out_arg: ++ di_write_unlock(parent); ++ aufs_read_unlock(dentry, AUFS_D_WLOCK); ++ kfree(arg); ++ out_whlist: ++ nhash_del(whlist); ++ out: ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/i_op_ren.c b/fs/aufs/i_op_ren.c +new file mode 100755 +index 0000000..08137f9 +--- /dev/null ++++ b/fs/aufs/i_op_ren.c +@@ -0,0 +1,637 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: i_op_ren.c,v 1.39 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++//#include <linux/fs.h> ++//#include <linux/namei.h> ++#include "aufs.h" ++ ++enum {SRC, DST}; ++struct rename_args { ++ struct dentry *hidden_dentry[2], *parent[2], *hidden_parent[2]; ++ struct aufs_nhash whlist; ++ aufs_bindex_t btgt, bstart[2]; ++ struct super_block *sb; ++ ++ unsigned int isdir:1; ++ unsigned int issamedir:1; ++ unsigned int whsrc:1; ++ unsigned int whdst:1; ++ unsigned int dlgt:1; ++} __attribute__((aligned(sizeof(long)))); ++ ++static int do_rename(struct inode *src_dir, struct dentry *src_dentry, ++ struct inode *dir, struct dentry *dentry, ++ struct rename_args *a) ++{ ++ int err, need_diropq, bycpup, rerr; ++ struct rmdir_whtmp_arg *tharg; ++ struct dentry *wh_dentry[2], *hidden_dst, *hg_parent; ++ struct inode *hidden_dir[2]; ++ aufs_bindex_t bindex, bend; ++ unsigned int flags; ++ struct lkup_args lkup = {.dlgt = a->dlgt}; ++ ++ LKTRTrace("%.*s/%.*s, %.*s/%.*s, " ++ "hd{%p, %p}, hp{%p, %p}, wh %p, btgt %d, bstart{%d, %d}, " ++ "flags{%d, %d, %d, %d}\n", ++ DLNPair(a->parent[SRC]), DLNPair(src_dentry), ++ DLNPair(a->parent[DST]), DLNPair(dentry), ++ a->hidden_dentry[SRC], a->hidden_dentry[DST], ++ a->hidden_parent[SRC], a->hidden_parent[DST], ++ &a->whlist, a->btgt, ++ a->bstart[SRC], a->bstart[DST], ++ a->isdir, a->issamedir, a->whsrc, a->whdst); ++ hidden_dir[SRC] = a->hidden_parent[SRC]->d_inode; ++ hidden_dir[DST] = a->hidden_parent[DST]->d_inode; ++ IMustLock(hidden_dir[SRC]); ++ IMustLock(hidden_dir[DST]); ++ ++ /* prepare workqueue arg */ ++ hidden_dst = NULL; ++ tharg = NULL; ++ if (a->isdir && a->hidden_dentry[DST]->d_inode) { ++ err = -ENOMEM; ++ tharg = kmalloc(sizeof(*tharg), GFP_KERNEL); ++ //tharg = NULL; ++ if (unlikely(!tharg)) ++ goto out; ++ hidden_dst = dget(a->hidden_dentry[DST]); ++ } ++ ++ wh_dentry[SRC] = wh_dentry[DST] = NULL; ++ lkup.nfsmnt = au_nfsmnt(a->sb, a->btgt); ++ /* create whiteout for src_dentry */ ++ if (a->whsrc) { ++ wh_dentry[SRC] = simple_create_wh(src_dentry, a->btgt, ++ a->hidden_parent[SRC], &lkup); ++ //wh_dentry[SRC] = ERR_PTR(-1); ++ err = PTR_ERR(wh_dentry[SRC]); ++ if (IS_ERR(wh_dentry[SRC])) ++ goto out_tharg; ++ } ++ ++ /* lookup whiteout for dentry */ ++ if (a->whdst) { ++ struct dentry *d; ++ d = lkup_wh(a->hidden_parent[DST], &dentry->d_name, &lkup); ++ //d = ERR_PTR(-1); ++ err = PTR_ERR(d); ++ if (IS_ERR(d)) ++ goto out_whsrc; ++ if (!d->d_inode) ++ dput(d); ++ else ++ wh_dentry[DST] = d; ++ } ++ ++ /* rename dentry to tmpwh */ ++ if (tharg) { ++ err = rename_whtmp(dentry, a->btgt); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_whdst; ++ set_h_dptr(dentry, a->btgt, NULL); ++ err = lkup_neg(dentry, a->btgt); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_whtmp; ++ a->hidden_dentry[DST] = au_h_dptr_i(dentry, a->btgt); ++ } ++ ++ /* cpup src */ ++ if (a->hidden_dentry[DST]->d_inode && a->bstart[SRC] != a->btgt) { ++ flags = au_flags_cpup(!CPUP_DTIME, a->parent[SRC]); ++ hg_parent = a->hidden_parent[SRC]->d_parent; ++ if (!(flags & CPUP_LOCKED_GHDIR) ++ && hg_parent == a->hidden_parent[DST]) ++ flags |= CPUP_LOCKED_GHDIR; ++ ++ hi_lock_child(a->hidden_dentry[SRC]->d_inode); ++ err = sio_cpup_simple(src_dentry, a->btgt, -1, flags); ++ //err = -1; // untested dir ++ i_unlock(a->hidden_dentry[SRC]->d_inode); ++ if (unlikely(err)) ++ goto out_whtmp; ++ } ++ ++#if 0 ++ /* clear the target ino in xino */ ++ LKTRTrace("dir %d, dst inode %p\n", a->isdir, a->hidden_dentry[DST]->d_inode); ++ if (a->isdir && a->hidden_dentry[DST]->d_inode) { ++ Dbg("here\n"); ++ err = xino_write(a->sb, a->btgt, ++ a->hidden_dentry[DST]->d_inode->i_ino, 0); ++ if (unlikely(err)) ++ goto out_whtmp; ++ } ++#endif ++ ++ /* rename by vfs_rename or cpup */ ++ need_diropq = a->isdir ++ && (wh_dentry[DST] ++ || dbdiropq(dentry) == a->btgt ++ || au_flag_test(a->sb, AuFlag_ALWAYS_DIROPQ)); ++ bycpup = 0; ++ if (dbstart(src_dentry) == a->btgt) { ++ if (need_diropq && dbdiropq(src_dentry) == a->btgt) ++ need_diropq = 0; ++ err = vfsub_rename(hidden_dir[SRC], au_h_dptr(src_dentry), ++ hidden_dir[DST], a->hidden_dentry[DST], ++ a->dlgt); ++ //err = -1; ++ } else { ++ bycpup = 1; ++ flags = au_flags_cpup(!CPUP_DTIME, a->parent[DST]); ++ hg_parent = a->hidden_parent[DST]->d_parent; ++ if (!(flags & CPUP_LOCKED_GHDIR) ++ && hg_parent == a->hidden_parent[SRC]) ++ flags |= CPUP_LOCKED_GHDIR; ++ ++ hi_lock_child(a->hidden_dentry[SRC]->d_inode); ++ set_dbstart(src_dentry, a->btgt); ++ set_h_dptr(src_dentry, a->btgt, dget(a->hidden_dentry[DST])); ++ //DbgDentry(src_dentry); ++ //DbgInode(src_dentry->d_inode); ++ err = sio_cpup_single(src_dentry, a->btgt, a->bstart[SRC], -1, ++ flags); ++ //err = -1; // untested dir ++ if (unlikely(err)) { ++ set_h_dptr(src_dentry, a->btgt, NULL); ++ set_dbstart(src_dentry, a->bstart[SRC]); ++ } ++ i_unlock(a->hidden_dentry[SRC]->d_inode); ++ } ++ if (unlikely(err)) ++ goto out_whtmp; ++ ++ /* make dir opaque */ ++ if (need_diropq) { ++ struct dentry *diropq; ++ struct inode *h_inode; ++ ++ h_inode = au_h_dptr_i(src_dentry, a->btgt)->d_inode; ++ hdir_lock(h_inode, src_dentry->d_inode, a->btgt); ++ diropq = create_diropq(src_dentry, a->btgt, a->dlgt); ++ //diropq = ERR_PTR(-1); ++ hdir_unlock(h_inode, src_dentry->d_inode, a->btgt); ++ err = PTR_ERR(diropq); ++ if (IS_ERR(diropq)) ++ goto out_rename; ++ dput(diropq); ++ } ++ ++ /* remove whiteout for dentry */ ++ if (wh_dentry[DST]) { ++ err = au_unlink_wh_dentry(hidden_dir[DST], wh_dentry[DST], ++ dentry, a->dlgt); ++ //err = -1; ++ if (unlikely(err)) ++ goto out_diropq; ++ } ++ ++ /* remove whtmp */ ++ if (tharg) { ++ if (au_is_nfs(hidden_dst->d_sb) ++ || !is_longer_wh(&a->whlist, a->btgt, ++ stosi(a->sb)->si_dirwh)) { ++ err = rmdir_whtmp(hidden_dst, &a->whlist, a->btgt, dir, ++ dentry->d_inode); ++ if (unlikely(err)) ++ Warn("failed removing whtmp dir %.*s (%d), " ++ "ignored.\n", DLNPair(hidden_dst), err); ++ } else { ++ kick_rmdir_whtmp(hidden_dst, &a->whlist, a->btgt, dir, ++ dentry->d_inode, tharg); ++ dput(hidden_dst); ++ tharg = NULL; ++ } ++ } ++ err = 0; ++ goto out_success; ++ ++#define RevertFailure(fmt, args...) do { \ ++ IOErrWhck("revert failure: " fmt " (%d, %d)\n", \ ++ ##args, err, rerr); \ ++ err = -EIO; \ ++ } while(0) ++ ++ out_diropq: ++ if (need_diropq) { ++ struct inode *h_inode; ++ ++ h_inode = au_h_dptr_i(src_dentry, a->btgt)->d_inode; ++ // i_lock simplly since inotify is not set to h_inode. ++ hi_lock_parent(h_inode); ++ //hdir_lock(h_inode, src_dentry->d_inode, a->btgt); ++ rerr = remove_diropq(src_dentry, a->btgt, a->dlgt); ++ //rerr = -1; ++ //hdir_unlock(h_inode, src_dentry->d_inode, a->btgt); ++ i_unlock(h_inode); ++ if (rerr) ++ RevertFailure("remove diropq %.*s", ++ DLNPair(src_dentry)); ++ } ++ out_rename: ++ if (!bycpup) { ++ struct dentry *d; ++ struct qstr *name = &src_dentry->d_name; ++ d = lkup_one(name->name, a->hidden_parent[SRC], name->len, ++ &lkup); ++ //d = ERR_PTR(-1); ++ rerr = PTR_ERR(d); ++ if (IS_ERR(d)) { ++ RevertFailure("lkup_one %.*s", DLNPair(src_dentry)); ++ goto out_whtmp; ++ } ++ DEBUG_ON(d->d_inode); ++ rerr = vfsub_rename ++ (hidden_dir[DST], au_h_dptr_i(src_dentry, a->btgt), ++ hidden_dir[SRC], d, a->dlgt); ++ //rerr = -1; ++ d_drop(d); ++ dput(d); ++ //set_h_dptr(src_dentry, a->btgt, NULL); ++ if (rerr) ++ RevertFailure("rename %.*s", DLNPair(src_dentry)); ++ } else { ++ rerr = vfsub_unlink(hidden_dir[DST], a->hidden_dentry[DST], ++ a->dlgt); ++ //rerr = -1; ++ set_h_dptr(src_dentry, a->btgt, NULL); ++ set_dbstart(src_dentry, a->bstart[SRC]); ++ if (rerr) ++ RevertFailure("unlink %.*s", ++ DLNPair(a->hidden_dentry[DST])); ++ } ++ out_whtmp: ++ if (tharg) { ++ struct dentry *d; ++ struct qstr *name = &dentry->d_name; ++ LKTRLabel(here); ++ d = lkup_one(name->name, a->hidden_parent[DST], name->len, ++ &lkup); ++ //d = ERR_PTR(-1); ++ rerr = PTR_ERR(d); ++ if (IS_ERR(d)) { ++ RevertFailure("lookup %.*s", LNPair(name)); ++ goto out_whdst; ++ } ++ if (d->d_inode) { ++ d_drop(d); ++ dput(d); ++ goto out_whdst; ++ } ++ DEBUG_ON(d->d_inode); ++ rerr = vfsub_rename(hidden_dir[DST], hidden_dst, ++ hidden_dir[DST], d, a->dlgt); ++ //rerr = -1; ++ d_drop(d); ++ dput(d); ++ if (rerr) { ++ RevertFailure("rename %.*s", DLNPair(hidden_dst)); ++ goto out_whdst; ++ } ++ set_h_dptr(dentry, a->btgt, NULL); ++ set_h_dptr(dentry, a->btgt, dget(hidden_dst)); ++ } ++ out_whdst: ++ dput(wh_dentry[DST]); ++ wh_dentry[DST] = NULL; ++ out_whsrc: ++ if (wh_dentry[SRC]) { ++ LKTRLabel(here); ++ rerr = au_unlink_wh_dentry(hidden_dir[SRC], wh_dentry[SRC], ++ src_dentry, a->dlgt); ++ //rerr = -1; ++ if (rerr) ++ RevertFailure("unlink %.*s", DLNPair(wh_dentry[SRC])); ++ } ++#undef RevertFailure ++ d_drop(src_dentry); ++ bend = dbend(src_dentry); ++ for (bindex = dbstart(src_dentry); bindex <= bend; bindex++) { ++ struct dentry *hd; ++ hd = au_h_dptr_i(src_dentry, bindex); ++ if (hd) ++ d_drop(hd); ++ } ++ d_drop(dentry); ++ bend = dbend(dentry); ++ for (bindex = dbstart(dentry); bindex <= bend; bindex++) { ++ struct dentry *hd; ++ hd = au_h_dptr_i(dentry, bindex); ++ if (hd) ++ d_drop(hd); ++ } ++ au_update_dbstart(dentry); ++ if (tharg) ++ d_drop(hidden_dst); ++ out_success: ++ dput(wh_dentry[SRC]); ++ dput(wh_dentry[DST]); ++ out_tharg: ++ if (tharg) { ++ dput(hidden_dst); ++ kfree(tharg); ++ } ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * test if @dentry dir can be rename destination or not. ++ * success means, it is a logically empty dir. ++ */ ++static int may_rename_dstdir(struct dentry *dentry, aufs_bindex_t btgt, ++ struct aufs_nhash *whlist) ++{ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ ++ return test_empty(dentry, whlist); ++} ++ ++/* ++ * test if @dentry dir can be rename source or not. ++ * if it can, return 0 and @children is filled. ++ * success means, ++ * - or, it is a logically empty dir. ++ * - or, it exists on writable branch and has no children including whiteouts ++ * on the lower branch. ++ */ ++static int may_rename_srcdir(struct dentry *dentry, aufs_bindex_t btgt) ++{ ++ int err; ++ aufs_bindex_t bstart; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ ++ bstart = dbstart(dentry); ++ if (bstart != btgt) { ++ struct aufs_nhash *whlist; ++ ++ whlist = nhash_new(GFP_KERNEL); ++ err = PTR_ERR(whlist); ++ if (IS_ERR(whlist)) ++ goto out; ++ err = test_empty(dentry, whlist); ++ nhash_del(whlist); ++ goto out; ++ } ++ ++ if (bstart == dbtaildir(dentry)) ++ return 0; /* success */ ++ ++ err = au_test_empty_lower(dentry); ++ ++ out: ++ if (/* unlikely */(err == -ENOTEMPTY)) ++ err = -EXDEV; ++ TraceErr(err); ++ return err; ++} ++ ++int aufs_rename(struct inode *src_dir, struct dentry *src_dentry, ++ struct inode *dir, struct dentry *dentry) ++{ ++ int err, do_dt_dstdir; ++ aufs_bindex_t bend, bindex; ++ struct inode *inode, *dirs[2]; ++ enum {PARENT, CHILD}; ++ /* reduce stack space */ ++ struct { ++ struct rename_args a; ++ struct dtime dt[2][2]; ++ } *p; ++ ++ LKTRTrace("i%lu, %.*s, i%lu, %.*s\n", ++ src_dir->i_ino, DLNPair(src_dentry), ++ dir->i_ino, DLNPair(dentry)); ++ IMustLock(src_dir); ++ IMustLock(dir); ++ /* braces are added to stop a warning */ ++ if (dentry->d_inode) { ++ IMustLock(dentry->d_inode); ++ } ++ ++ err = -ENOMEM; ++ BUILD_BUG_ON(sizeof(*p) > PAGE_SIZE); ++ p = kmalloc(sizeof(*p), GFP_KERNEL); ++ if (unlikely(!p)) ++ goto out; ++ ++ err = -ENOTDIR; ++ p->a.sb = src_dentry->d_sb; ++ inode = src_dentry->d_inode; ++ p->a.isdir = !!S_ISDIR(inode->i_mode); ++ if (unlikely(p->a.isdir && dentry->d_inode ++ && !S_ISDIR(dentry->d_inode->i_mode))) ++ goto out_free; ++ ++ aufs_read_and_write_lock2(dentry, src_dentry, p->a.isdir); ++ p->a.dlgt = !!need_dlgt(p->a.sb); ++ p->a.parent[SRC] = p->a.parent[DST] = dentry->d_parent; ++ p->a.issamedir = (src_dir == dir); ++ if (p->a.issamedir) ++ di_write_lock_parent(p->a.parent[DST]); ++ else { ++ p->a.parent[SRC] = src_dentry->d_parent; ++ di_write_lock2_parent(p->a.parent[SRC], p->a.parent[DST], ++ /*isdir*/1); ++ } ++ ++ /* which branch we process */ ++ p->a.bstart[DST] = dbstart(dentry); ++ p->a.btgt = err = wr_dir(dentry, 1, src_dentry, /*force_btgt*/-1, ++ /*do_lock_srcdir*/0); ++ if (unlikely(err < 0)) ++ goto out_unlock; ++ ++ /* are they available to be renamed */ ++ err = 0; ++ nhash_init(&p->a.whlist); ++ if (p->a.isdir && dentry->d_inode) { ++ set_dbstart(dentry, p->a.bstart[DST]); ++ err = may_rename_dstdir(dentry, p->a.btgt, &p->a.whlist); ++ set_dbstart(dentry, p->a.btgt); ++ } ++ p->a.hidden_dentry[DST] = au_h_dptr(dentry); ++ if (unlikely(err)) ++ goto out_unlock; ++ //todo: minor optimize, their sb may be same while their bindex differs. ++ p->a.bstart[SRC] = dbstart(src_dentry); ++ p->a.hidden_dentry[SRC] = au_h_dptr(src_dentry); ++ if (p->a.isdir) { ++ err = may_rename_srcdir(src_dentry, p->a.btgt); ++ if (unlikely(err)) ++ goto out_children; ++ } ++ ++ /* prepare the writable parent dir on the same branch */ ++ err = wr_dir_need_wh(src_dentry, p->a.isdir, &p->a.btgt, ++ p->a.issamedir ? NULL : p->a.parent[DST]); ++ if (unlikely(err < 0)) ++ goto out_children; ++ p->a.whsrc = !!err; ++ p->a.whdst = (p->a.bstart[DST] == p->a.btgt); ++ if (!p->a.whdst) { ++ err = cpup_dirs(dentry, p->a.btgt, ++ p->a.issamedir ? NULL : p->a.parent[SRC]); ++ if (unlikely(err)) ++ goto out_children; ++ } ++ ++ p->a.hidden_parent[SRC] = au_h_dptr_i(p->a.parent[SRC], p->a.btgt); ++ p->a.hidden_parent[DST] = au_h_dptr_i(p->a.parent[DST], p->a.btgt); ++ dirs[0] = src_dir; ++ dirs[1] = dir; ++ hdir_lock_rename(p->a.hidden_parent, dirs, p->a.btgt, p->a.issamedir); ++ ++ /* store timestamps to be revertible */ ++ dtime_store(p->dt[PARENT] + SRC, p->a.parent[SRC], ++ p->a.hidden_parent[SRC]); ++ if (!p->a.issamedir) ++ dtime_store(p->dt[PARENT] + DST, p->a.parent[DST], ++ p->a.hidden_parent[DST]); ++ do_dt_dstdir = 0; ++ if (p->a.isdir) { ++ dtime_store(p->dt[CHILD] + SRC, src_dentry, ++ p->a.hidden_dentry[SRC]); ++ if (p->a.hidden_dentry[DST]->d_inode) { ++ do_dt_dstdir = 1; ++ dtime_store(p->dt[CHILD] + DST, dentry, ++ p->a.hidden_dentry[DST]); ++ } ++ } ++ ++ err = do_rename(src_dir, src_dentry, dir, dentry, &p->a); ++ if (unlikely(err)) ++ goto out_dt; ++ hdir_unlock_rename(p->a.hidden_parent, dirs, p->a.btgt, p->a.issamedir); ++ ++ /* update dir attributes */ ++ dir->i_version++; ++ if (p->a.isdir) ++ au_cpup_attr_nlink(dir); ++ if (ibstart(dir) == p->a.btgt) ++ au_cpup_attr_timesizes(dir); ++ ++ if (!p->a.issamedir) { ++ src_dir->i_version++; ++ if (p->a.isdir) ++ au_cpup_attr_nlink(src_dir); ++ if (ibstart(src_dir) == p->a.btgt) ++ au_cpup_attr_timesizes(src_dir); ++ } ++ ++ // is this updating defined in POSIX? ++ if (unlikely(p->a.isdir)) { ++ //i_lock(inode); ++ au_cpup_attr_timesizes(inode); ++ //i_unlock(inode); ++ } ++ ++#if 0 ++ d_drop(src_dentry); ++#else ++ /* dput/iput all lower dentries */ ++ set_dbwh(src_dentry, -1); ++ bend = dbend(src_dentry); ++ for (bindex = p->a.btgt + 1; bindex <= bend; bindex++) { ++ struct dentry *hd; ++ hd = au_h_dptr_i(src_dentry, bindex); ++ if (hd) ++ set_h_dptr(src_dentry, bindex, NULL); ++ } ++ set_dbend(src_dentry, p->a.btgt); ++ ++ bend = ibend(inode); ++ for (bindex = p->a.btgt + 1; bindex <= bend; bindex++) { ++ struct inode *hi; ++ hi = au_h_iptr_i(inode, bindex); ++ if (hi) ++ set_h_iptr(inode, bindex, NULL, 0); ++ } ++ set_ibend(inode, p->a.btgt); ++#endif ++ ++#if 0 ++ //au_debug_on(); ++ //DbgDentry(dentry); ++ //DbgInode(dentry->d_inode); ++ //au_debug_off(); ++ inode = dentry->d_inode; ++ if (inode) { ++ aufs_bindex_t bindex, bend; ++ struct dentry *hd; ++ bend = dbend(dentry); ++ for (bindex = dbstart(dentry); bindex <= bend; bindex++) { ++ hd = au_h_dptr_i(dentry, bindex); ++ if (hd && hd->d_inode) ++ xino_write0(p->a.sb, bindex, hd->d_inode->i_ino); ++ /* ignore this error */ ++ } ++ } ++#endif ++ ++ goto out_children; /* success */ ++ ++ out_dt: ++ dtime_revert(p->dt[PARENT] + SRC, ++ p->a.hidden_parent[SRC]->d_parent ++ == p->a.hidden_parent[DST]); ++ if (!p->a.issamedir) ++ dtime_revert(p->dt[PARENT] + DST, ++ p->a.hidden_parent[DST]->d_parent ++ == p->a.hidden_parent[SRC]); ++ if (p->a.isdir && err != -EIO) { ++ struct dentry *hd; ++ ++ hd = p->dt[CHILD][SRC].dt_h_dentry; ++ hi_lock_child(hd->d_inode); ++ dtime_revert(p->dt[CHILD] + SRC, 1); ++ i_unlock(hd->d_inode); ++ if (do_dt_dstdir) { ++ hd = p->dt[CHILD][DST].dt_h_dentry; ++ hi_lock_child(hd->d_inode); ++ dtime_revert(p->dt[CHILD] + DST, 1); ++ i_unlock(hd->d_inode); ++ } ++ } ++ hdir_unlock_rename(p->a.hidden_parent, dirs, p->a.btgt, p->a.issamedir); ++ out_children: ++ nhash_fin(&p->a.whlist); ++ out_unlock: ++ //if (unlikely(err /* && p->a.isdir */)) { ++ if (unlikely(err && p->a.isdir)) { ++ au_update_dbstart(dentry); ++ d_drop(dentry); ++ } ++ if (p->a.issamedir) ++ di_write_unlock(p->a.parent[DST]); ++ else ++ di_write_unlock2(p->a.parent[SRC], p->a.parent[DST]); ++ aufs_read_and_write_unlock2(dentry, src_dentry); ++ out_free: ++ kfree(p); ++ out: ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/iinfo.c b/fs/aufs/iinfo.c +new file mode 100755 +index 0000000..9efbd38 +--- /dev/null ++++ b/fs/aufs/iinfo.c +@@ -0,0 +1,286 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: iinfo.c,v 1.31 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++//#include <linux/mm.h> ++#include "aufs.h" ++ ++struct aufs_iinfo *itoii(struct inode *inode) ++{ ++ struct aufs_iinfo *iinfo; ++ ++ iinfo = &(container_of(inode, struct aufs_icntnr, vfs_inode)->iinfo); ++ /* bad_inode case */ ++ if (unlikely(!iinfo->ii_hinode)) ++ return NULL; ++ DEBUG_ON(!iinfo->ii_hinode ++ /* || stosi(inode->i_sb)->si_bend < iinfo->ii_bend */ ++ || iinfo->ii_bend < iinfo->ii_bstart); ++ return iinfo; ++} ++ ++aufs_bindex_t ibstart(struct inode *inode) ++{ ++ IiMustAnyLock(inode); ++ return itoii(inode)->ii_bstart; ++} ++ ++aufs_bindex_t ibend(struct inode *inode) ++{ ++ IiMustAnyLock(inode); ++ return itoii(inode)->ii_bend; ++} ++ ++struct aufs_vdir *ivdir(struct inode *inode) ++{ ++ IiMustAnyLock(inode); ++ DEBUG_ON(!S_ISDIR(inode->i_mode)); ++ return itoii(inode)->ii_vdir; ++} ++ ++struct inode *au_h_iptr_i(struct inode *inode, aufs_bindex_t bindex) ++{ ++ struct inode *hidden_inode; ++ ++ IiMustAnyLock(inode); ++ DEBUG_ON(bindex < 0 || ibend(inode) < bindex); ++ hidden_inode = itoii(inode)->ii_hinode[0 + bindex].hi_inode; ++ DEBUG_ON(hidden_inode && atomic_read(&hidden_inode->i_count) <= 0); ++ return hidden_inode; ++} ++ ++struct inode *au_h_iptr(struct inode *inode) ++{ ++ return au_h_iptr_i(inode, ibstart(inode)); ++} ++ ++aufs_bindex_t itoid_index(struct inode *inode, aufs_bindex_t bindex) ++{ ++ IiMustAnyLock(inode); ++ DEBUG_ON(bindex < 0 ++ || ibend(inode) < bindex ++ || !itoii(inode)->ii_hinode[0 + bindex].hi_inode); ++ return itoii(inode)->ii_hinode[0 + bindex].hi_id; ++} ++ ++// hard/soft set ++void set_ibstart(struct inode *inode, aufs_bindex_t bindex) ++{ ++ struct aufs_iinfo *iinfo = itoii(inode); ++ struct inode *h_inode; ++ ++ IiMustWriteLock(inode); ++ DEBUG_ON(sbend(inode->i_sb) < bindex); ++ iinfo->ii_bstart = bindex; ++ h_inode = iinfo->ii_hinode[bindex + 0].hi_inode; ++ if (h_inode) ++ au_cpup_igen(inode, h_inode); ++} ++ ++void set_ibend(struct inode *inode, aufs_bindex_t bindex) ++{ ++ IiMustWriteLock(inode); ++ DEBUG_ON(sbend(inode->i_sb) < bindex ++ || bindex < ibstart(inode)); ++ itoii(inode)->ii_bend = bindex; ++} ++ ++void set_ivdir(struct inode *inode, struct aufs_vdir *vdir) ++{ ++ IiMustWriteLock(inode); ++ DEBUG_ON(!S_ISDIR(inode->i_mode) ++ || (itoii(inode)->ii_vdir && vdir)); ++ itoii(inode)->ii_vdir = vdir; ++} ++ ++void aufs_hiput(struct aufs_hinode *hinode) ++{ ++ if (unlikely(hinode->hi_notify)) ++ do_free_hinotify(hinode); ++ if (hinode->hi_inode) ++ iput(hinode->hi_inode); ++} ++ ++unsigned int au_hi_flags(struct inode *inode, int isdir) ++{ ++ unsigned int flags; ++ struct super_block *sb = inode->i_sb; ++ ++ flags = 0; ++ if (au_flag_test(sb, AuFlag_XINO)) ++ flags = AUFS_HI_XINO; ++ if (unlikely(isdir && au_flag_test(sb, AuFlag_UDBA_INOTIFY))) ++ flags |= AUFS_HI_NOTIFY; ++ return flags; ++} ++ ++void set_h_iptr(struct inode *inode, aufs_bindex_t bindex, ++ struct inode *h_inode, unsigned int flags) ++{ ++ struct aufs_hinode *hinode; ++ struct inode *hi; ++ struct aufs_iinfo *iinfo = itoii(inode); ++ ++ LKTRTrace("i%lu, b%d, hi%lu, flags 0x%x\n", ++ inode->i_ino, bindex, h_inode ? h_inode->i_ino : 0, flags); ++ IiMustWriteLock(inode); ++ hinode = iinfo->ii_hinode + bindex; ++ hi = hinode->hi_inode; ++ DEBUG_ON(bindex < ibstart(inode) || ibend(inode) < bindex ++ || (h_inode && atomic_read(&h_inode->i_count) <= 0) ++ || (h_inode && hi)); ++ ++ if (hi) ++ aufs_hiput(hinode); ++ hinode->hi_inode = h_inode; ++ if (h_inode) { ++ int err; ++ struct super_block *sb = inode->i_sb; ++ ++ if (bindex == iinfo->ii_bstart) ++ au_cpup_igen(inode, h_inode); ++ hinode->hi_id = sbr_id(sb, bindex); ++ if (flags & AUFS_HI_XINO) { ++ struct xino xino = { ++ .ino = inode->i_ino, ++ //.h_gen = h_inode->i_generation ++ }; ++ //WARN_ON(xino.h_gen == AuXino_INVALID_HGEN); ++ err = xino_write(sb, bindex, h_inode->i_ino, &xino); ++ if (unlikely(err)) { ++ IOErr1("failed xino_write() %d, force noxino\n", ++ err); ++ au_flag_clr(sb, AuFlag_XINO); ++ } ++ } ++ if (flags & AUFS_HI_NOTIFY) { ++ err = alloc_hinotify(hinode, inode, h_inode); ++ if (unlikely(err)) ++ IOErr1("alloc_hinotify() %d\n", err); ++ else { ++ /* braces are added to stop a warning */ ++ DEBUG_ON(!hinode->hi_notify); ++ } ++ } ++ } ++} ++ ++void au_update_iigen(struct inode *inode) ++{ ++ //IiMustWriteLock(inode); ++ DEBUG_ON(!inode->i_sb); ++ atomic_set(&itoii(inode)->ii_generation, au_sigen(inode->i_sb)); ++} ++ ++/* it may be called at remount time, too */ ++void au_update_brange(struct inode *inode, int do_put_zero) ++{ ++ struct aufs_iinfo *iinfo; ++ ++ LKTRTrace("i%lu, %d\n", inode->i_ino, do_put_zero); ++ IiMustWriteLock(inode); ++ ++ iinfo = itoii(inode); ++ if (unlikely(!iinfo) || iinfo->ii_bstart < 0) ++ return; ++ ++ if (do_put_zero) { ++ aufs_bindex_t bindex; ++ for (bindex = iinfo->ii_bstart; bindex <= iinfo->ii_bend; ++ bindex++) { ++ struct inode *h_i; ++ h_i = iinfo->ii_hinode[0 + bindex].hi_inode; ++ if (h_i && !h_i->i_nlink) ++ set_h_iptr(inode, bindex, NULL, 0); ++ } ++ } ++ ++ iinfo->ii_bstart = -1; ++ while (++iinfo->ii_bstart <= iinfo->ii_bend) ++ if (iinfo->ii_hinode[0 + iinfo->ii_bstart].hi_inode) ++ break; ++ if (iinfo->ii_bstart > iinfo->ii_bend) { ++ iinfo->ii_bend = iinfo->ii_bstart = -1; ++ return; ++ } ++ ++ iinfo->ii_bend++; ++ while (0 <= --iinfo->ii_bend) ++ if (iinfo->ii_hinode[0 + iinfo->ii_bend].hi_inode) ++ break; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++int au_iinfo_init(struct inode *inode) ++{ ++ struct aufs_iinfo *iinfo; ++ struct super_block *sb; ++ int nbr, i; ++ ++ sb = inode->i_sb; ++ DEBUG_ON(!sb); ++ iinfo = &(container_of(inode, struct aufs_icntnr, vfs_inode)->iinfo); ++ DEBUG_ON(iinfo->ii_hinode); ++ nbr = sbend(sb) + 1; ++ if (unlikely(!nbr)) ++ nbr++; ++ iinfo->ii_hinode = kcalloc(nbr, sizeof(*iinfo->ii_hinode), GFP_KERNEL); ++ //iinfo->ii_hinode = NULL; ++ if (iinfo->ii_hinode) { ++ for (i = 0; i < nbr; i++) ++ iinfo->ii_hinode[i].hi_id = -1; ++ atomic_set(&iinfo->ii_generation, au_sigen(sb)); ++ rw_init_nolock(&iinfo->ii_rwsem); ++ iinfo->ii_bstart = -1; ++ iinfo->ii_bend = -1; ++ iinfo->ii_vdir = NULL; ++ return 0; ++ } ++ return -ENOMEM; ++} ++ ++void au_iinfo_fin(struct inode *inode) ++{ ++ struct aufs_iinfo *iinfo; ++ ++ iinfo = itoii(inode); ++ /* bad_inode case */ ++ if (unlikely(!iinfo)) ++ return; ++ ++ if (unlikely(iinfo->ii_vdir)) ++ free_vdir(iinfo->ii_vdir); ++ ++ if (iinfo->ii_bstart >= 0) { ++ aufs_bindex_t bend; ++ struct aufs_hinode *hi; ++ hi = iinfo->ii_hinode + iinfo->ii_bstart; ++ bend = iinfo->ii_bend; ++ while (iinfo->ii_bstart++ <= bend) { ++ if (hi->hi_inode) ++ aufs_hiput(hi); ++ hi++; ++ } ++ //iinfo->ii_bstart = iinfo->ii_bend = -1; ++ } ++ ++ kfree(iinfo->ii_hinode); ++ //iinfo->ii_hinode = NULL; ++} +diff --git a/fs/aufs/inode.c b/fs/aufs/inode.c +new file mode 100755 +index 0000000..f18b5d8 +--- /dev/null ++++ b/fs/aufs/inode.c +@@ -0,0 +1,339 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: inode.c,v 1.22 2007/05/07 03:44:35 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++int au_refresh_hinode(struct inode *inode, struct dentry *dentry) ++{ ++ int err, new_sz, update, isdir; ++ struct inode *first; ++ struct aufs_hinode *p, *q, tmp; ++ struct super_block *sb; ++ struct aufs_iinfo *iinfo; ++ aufs_bindex_t bindex, bend, new_bindex; ++ unsigned int flags; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ IiMustWriteLock(inode); ++ ++ err = -ENOMEM; ++ sb = dentry->d_sb; ++ bend = sbend(sb); ++ new_sz = sizeof(*iinfo->ii_hinode) * (bend + 1); ++ iinfo = itoii(inode); ++ p = au_kzrealloc(iinfo->ii_hinode, sizeof(*p) * (iinfo->ii_bend + 1), ++ new_sz, GFP_KERNEL); ++ //p = NULL; ++ if (unlikely(!p)) ++ goto out; ++ ++ iinfo->ii_hinode = p; ++ err = 0; ++ update = 0; ++ p = iinfo->ii_hinode + iinfo->ii_bstart; ++ first = p->hi_inode; ++ for (bindex = iinfo->ii_bstart; bindex <= iinfo->ii_bend; ++ bindex++, p++) { ++ if (unlikely(!p->hi_inode)) ++ continue; ++ ++ new_bindex = find_brindex(sb, p->hi_id); ++ if (new_bindex == bindex) ++ continue; ++ if (new_bindex < 0) { ++ update++; ++ aufs_hiput(p); ++ p->hi_inode = NULL; ++ continue; ++ } ++ ++ if (new_bindex < iinfo->ii_bstart) ++ iinfo->ii_bstart = new_bindex; ++ if (iinfo->ii_bend < new_bindex) ++ iinfo->ii_bend = new_bindex; ++ /* swap two hidden inode, and loop again */ ++ q = iinfo->ii_hinode + new_bindex; ++ tmp = *q; ++ *q = *p; ++ *p = tmp; ++ if (tmp.hi_inode) { ++ bindex--; ++ p--; ++ } ++ } ++ ++ isdir = S_ISDIR(inode->i_mode); ++ flags = au_hi_flags(inode, isdir); ++ bend = dbend(dentry); ++ for (bindex = dbstart(dentry); bindex <= bend; bindex++) { ++ struct inode *hi; ++ struct dentry *hd; ++ ++ hd = au_h_dptr_i(dentry, bindex); ++ if (!hd || !hd->d_inode) ++ continue; ++ ++ if (iinfo->ii_bstart <= bindex && bindex <= iinfo->ii_bend) { ++ hi = au_h_iptr_i(inode, bindex); ++ if (hi) { ++ if (hi == hd->d_inode) ++ continue; ++ //Dbg("here\n"); ++ err = -ESTALE; ++ break; ++ } ++ } ++ if (bindex < iinfo->ii_bstart) ++ iinfo->ii_bstart = bindex; ++ if (iinfo->ii_bend < bindex) ++ iinfo->ii_bend = bindex; ++ set_h_iptr(inode, bindex, igrab(hd->d_inode), flags); ++ update++; ++ } ++ ++ bend = iinfo->ii_bend; ++ p = iinfo->ii_hinode; ++ for (bindex = 0; bindex <= bend; bindex++, p++) ++ if (p->hi_inode) { ++ iinfo->ii_bstart = bindex; ++ break; ++ } ++ p = iinfo->ii_hinode + bend; ++ for (bindex = bend; bindex > iinfo->ii_bstart; bindex--, p--) ++ if (p->hi_inode) { ++ iinfo->ii_bend = bindex; ++ break; ++ } ++ DEBUG_ON(iinfo->ii_bstart > bend || iinfo->ii_bend < 0); ++ ++ if (unlikely(err)) ++ goto out; ++ ++ if (1 || first != au_h_iptr(inode)) ++ au_cpup_attr_all(inode); ++ if (update && isdir) ++ inode->i_version++; ++ au_update_iigen(inode); ++ ++ out: ++ //au_debug_on(); ++ TraceErr(err); ++ //au_debug_off(); ++ return err; ++} ++ ++static int set_inode(struct inode *inode, struct dentry *dentry) ++{ ++ int err, isdir; ++ struct dentry *hidden_dentry; ++ struct inode *hidden_inode; ++ umode_t mode; ++ aufs_bindex_t bindex, bstart, btail; ++ struct aufs_iinfo *iinfo; ++ unsigned int flags; ++ ++ LKTRTrace("i%lu, %.*s\n", inode->i_ino, DLNPair(dentry)); ++ DEBUG_ON(!(inode->i_state & I_NEW)); ++ IiMustWriteLock(inode); ++ hidden_dentry = au_h_dptr(dentry); ++ DEBUG_ON(!hidden_dentry); ++ hidden_inode = hidden_dentry->d_inode; ++ DEBUG_ON(!hidden_inode); ++ ++ err = 0; ++ isdir = 0; ++ bstart = dbstart(dentry); ++ mode = hidden_inode->i_mode; ++ switch (mode & S_IFMT) { ++ case S_IFREG: ++ btail = dbtail(dentry); ++ break; ++ case S_IFDIR: ++ isdir = 1; ++ btail = dbtaildir(dentry); ++ inode->i_op = &aufs_dir_iop; ++ inode->i_fop = &aufs_dir_fop; ++ break; ++ case S_IFLNK: ++ btail = dbtail(dentry); ++ inode->i_op = &aufs_symlink_iop; ++ break; ++ case S_IFBLK: ++ case S_IFCHR: ++ case S_IFIFO: ++ case S_IFSOCK: ++ btail = dbtail(dentry); ++ init_special_inode(inode, mode, hidden_inode->i_rdev); ++ break; ++ default: ++ IOErr("Unknown file type 0%o\n", mode); ++ err = -EIO; ++ goto out; ++ } ++ ++ flags = au_hi_flags(inode, isdir); ++ iinfo = itoii(inode); ++ iinfo->ii_bstart = bstart; ++ iinfo->ii_bend = btail; ++ for (bindex = bstart; bindex <= btail; bindex++) { ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (!hidden_dentry) ++ continue; ++ DEBUG_ON(!hidden_dentry->d_inode); ++ set_h_iptr(inode, bindex, igrab(hidden_dentry->d_inode), flags); ++ } ++ au_cpup_attr_all(inode); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* successful returns with iinfo write_locked */ ++//todo: return with unlocked? ++static int reval_inode(struct inode *inode, struct dentry *dentry, int *matched) ++{ ++ int err; ++ struct inode *h_inode, *h_dinode; ++ aufs_bindex_t bindex, bend; ++ //const int udba = !au_flag_test(inode->i_sb, AuFlag_UDBA_NONE); ++ ++ LKTRTrace("i%lu, %.*s\n", inode->i_ino, DLNPair(dentry)); ++ ++ *matched = 0; ++ ++ /* ++ * before this function, if aufs got any iinfo lock, it must be only ++ * one, the parent dir. ++ * it can happen by UDBA and the obsoleted inode number. ++ */ ++ err = -EIO; ++ if (unlikely(inode->i_ino == parent_ino(dentry))) ++ goto out; ++ ++ h_dinode = au_h_dptr(dentry)->d_inode; ++ hi_lock_child(inode); // bad name, this is not a hidden inode. ++ ii_write_lock_new(inode); ++ bend = ibend(inode); ++ for (bindex = ibstart(inode); bindex <= bend; bindex++) { ++ h_inode = au_h_iptr_i(inode, bindex); ++ if (h_inode && h_inode == h_dinode) { ++ //&& (ibs != bstart || !au_test_higen(inode, h_inode))); ++ *matched = 1; ++ err = 0; ++ if (unlikely(au_iigen(inode) != au_digen(dentry))) ++ err = au_refresh_hinode(inode, dentry); ++ break; ++ } ++ } ++ i_unlock(inode); ++ if (unlikely(err)) ++ ii_write_unlock(inode); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* successful returns with iinfo write_locked */ ++//todo: return with unlocked? ++struct inode *au_new_inode(struct dentry *dentry) ++{ ++ struct inode *inode, *h_inode; ++ struct dentry *h_dentry; ++ ino_t h_ino; ++ struct super_block *sb; ++ int err, match; ++ aufs_bindex_t bstart; ++ struct xino xino; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ sb = dentry->d_sb; ++ h_dentry = au_h_dptr(dentry); ++ DEBUG_ON(!h_dentry); ++ h_inode = h_dentry->d_inode; ++ DEBUG_ON(!h_inode); ++ ++ bstart = dbstart(dentry); ++ h_ino = h_inode->i_ino; ++ err = xino_read(sb, bstart, h_ino, &xino); ++ //err = -1; ++ inode = ERR_PTR(err); ++ if (unlikely(err)) ++ goto out; ++ new_ino: ++ if (!xino.ino) { ++ xino.ino = xino_new_ino(sb); ++ if (!xino.ino) { ++ inode = ERR_PTR(-EIO); ++ goto out; ++ } ++ } ++ ++ LKTRTrace("i%lu\n", xino.ino); ++ err = -ENOMEM; ++ inode = iget_locked(sb, xino.ino); ++ if (unlikely(!inode)) ++ goto out; ++ err = PTR_ERR(inode); ++ if (IS_ERR(inode)) ++ goto out; ++ err = -ENOMEM; ++ if (unlikely(is_bad_inode(inode))) ++ goto out_iput; ++ ++ LKTRTrace("%lx, new %d\n", inode->i_state, !!(inode->i_state & I_NEW)); ++ if (inode->i_state & I_NEW) { ++ sb->s_op->read_inode(inode); ++ if (!is_bad_inode(inode)) { ++ ii_write_lock_new(inode); ++ err = set_inode(inode, dentry); ++ //err = -1; ++ } ++ unlock_new_inode(inode); ++ if (!err) ++ goto out; /* success */ ++ ii_write_unlock(inode); ++ goto out_iput; ++ } else { ++ err = reval_inode(inode, dentry, &match); ++ if (!err) ++ goto out; /* success */ ++ else if (match) ++ goto out_iput; ++ } ++ ++ Warn1("broken ino, b%d, %.*s/%.*s, hi%lu, i%lu. Try udba=inotify.\n", ++ bstart, DLNPair(dentry->d_parent), DLNPair(dentry), h_ino, ++ xino.ino); ++ xino.ino = 0; ++ err = xino_write0(sb, bstart, h_ino); ++ if (!err) { ++ iput(inode); ++ goto new_ino; ++ } ++ ++ out_iput: ++ iput(inode); ++ inode = ERR_PTR(err); ++ out: ++ TraceErrPtr(inode); ++ return inode; ++} +diff --git a/fs/aufs/inode.h b/fs/aufs/inode.h +new file mode 100755 +index 0000000..b001ac3 +--- /dev/null ++++ b/fs/aufs/inode.h +@@ -0,0 +1,377 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: inode.h,v 1.32 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_INODE_H__ ++#define __AUFS_INODE_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/inotify.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++#include "misc.h" ++#include "vfsub.h" ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++#else ++struct inotify_watch {}; ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct aufs_hinotify { ++ struct inotify_watch hin_watch; ++ struct inode *hin_aufs_inode; /* no get/put */ ++}; ++ ++struct aufs_hinode { ++ struct inode *hi_inode; ++ aufs_bindex_t hi_id; ++ struct aufs_hinotify *hi_notify; ++}; ++ ++struct aufs_vdir; ++struct aufs_iinfo { ++ atomic_t ii_generation; ++ struct super_block *ii_hsb1; /* no get/put */ ++ ++ struct aufs_rwsem ii_rwsem; ++ aufs_bindex_t ii_bstart, ii_bend; ++ struct aufs_hinode *ii_hinode; ++ struct aufs_vdir *ii_vdir; ++}; ++ ++struct aufs_icntnr { ++ struct aufs_iinfo iinfo; ++ struct inode vfs_inode; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* inode.c */ ++int au_refresh_hinode(struct inode *inode, struct dentry *dentry); ++struct inode *au_new_inode(struct dentry *dentry); ++ ++/* i_op.c */ ++extern struct inode_operations aufs_iop, aufs_symlink_iop, aufs_dir_iop; ++int wr_dir(struct dentry *dentry, int negative, struct dentry *src_dentry, ++ aufs_bindex_t force_btgt, int do_lock_srcdir); ++ ++/* i_op_del.c */ ++int wr_dir_need_wh(struct dentry *dentry, int isdir, aufs_bindex_t *bcpup, ++ struct dentry *locked); ++ ++/* iinfo.c */ ++struct aufs_iinfo *itoii(struct inode *inode); ++aufs_bindex_t ibstart(struct inode *inode); ++aufs_bindex_t ibend(struct inode *inode); ++struct aufs_vdir *ivdir(struct inode *inode); ++struct inode *au_h_iptr_i(struct inode *inode, aufs_bindex_t bindex); ++struct inode *au_h_iptr(struct inode *inode); ++aufs_bindex_t itoid_index(struct inode *inode, aufs_bindex_t bindex); ++ ++void set_ibstart(struct inode *inode, aufs_bindex_t bindex); ++void set_ibend(struct inode *inode, aufs_bindex_t bindex); ++void set_ivdir(struct inode *inode, struct aufs_vdir *vdir); ++void aufs_hiput(struct aufs_hinode *hinode); ++#define AUFS_HI_XINO 1 ++#define AUFS_HI_NOTIFY 2 ++unsigned int au_hi_flags(struct inode *inode, int isdir); ++void set_h_iptr(struct inode *inode, aufs_bindex_t bindex, ++ struct inode *h_inode, unsigned int flags); ++void au_update_iigen(struct inode *inode); ++void au_update_brange(struct inode *inode, int do_put_zero); ++ ++int au_iinfo_init(struct inode *inode); ++void au_iinfo_fin(struct inode *inode); ++ ++/* plink.c */ ++#ifdef CONFIG_AUFS_DEBUG ++void au_list_plink(struct super_block *sb); ++#else ++static inline void au_list_plink(struct super_block *sb) ++{ ++ /* nothing */ ++} ++#endif ++int au_is_plinked(struct super_block *sb, struct inode *inode); ++struct dentry *lkup_plink(struct super_block *sb, aufs_bindex_t bindex, ++ struct inode *inode); ++void append_plink(struct super_block *sb, struct inode *inode, ++ struct dentry *h_dentry, aufs_bindex_t bindex); ++void au_put_plink(struct super_block *sb); ++void half_refresh_plink(struct super_block *sb, aufs_bindex_t br_id); ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* lock subclass for hidden inode */ ++/* default MAX_LOCKDEP_SUBCLASSES(8) is not enough */ ++// todo: reduce it by dcsub. ++enum { ++ AuLsc_Begin = I_MUTEX_QUOTA, ++ AuLsc_HI_GPARENT, /* setattr with inotify */ ++ AuLsc_HI_PARENT, /* hidden inode, parent first */ ++ AuLsc_HI_CHILD, ++ AuLsc_HI_PARENT2, /* copyup dirs */ ++ AuLsc_HI_CHILD2, ++ AuLsc_End ++}; ++ ++/* simple abstraction */ ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,16) ++static inline void i_lock(struct inode *i) ++{ ++ down(&i->i_sem); ++} ++ ++static inline void i_unlock(struct inode *i) ++{ ++ up(&i->i_sem); ++} ++ ++static inline int i_trylock(struct inode *i) ++{ ++ return down_trylock(&i->i_sem); ++} ++ ++static inline void hi_lock(struct inode *i, unsigned int lsc) ++{ ++ i_lock(i); ++} ++ ++#define IMustLock(i) DEBUG_ON(!down_trylock(&(i)->i_sem)) ++#else ++static inline void i_lock(struct inode *i) ++{ ++ mutex_lock(&i->i_mutex); ++} ++ ++static inline void i_unlock(struct inode *i) ++{ ++ mutex_unlock(&i->i_mutex); ++} ++ ++static inline int i_trylock(struct inode *i) ++{ ++ return mutex_trylock(&i->i_mutex); ++} ++ ++static inline void hi_lock(struct inode *i, unsigned int lsc) ++{ ++ mutex_lock_nested(&i->i_mutex, lsc); ++} ++ ++#define IMustLock(i) MtxMustLock(&(i)->i_mutex) ++#endif ++ ++/* ++ * hi_lock_gparent, hi_lock_parent, hi_lock_parent2, hi_lock_child, ++ * hi_lock_child2, hi_lock_whplink ++ */ ++#define LockFunc(name, lsc) \ ++static inline void hi_lock_##name(struct inode *h_i) \ ++{hi_lock(h_i, AuLsc_HI_##lsc);} ++ ++LockFunc(gparent, GPARENT); ++LockFunc(parent, PARENT); ++LockFunc(parent2, PARENT2); ++LockFunc(child, CHILD); ++LockFunc(child2, CHILD2); ++LockFunc(whplink, CHILD2); /* sharing lock-subclass */ ++ ++#undef LockFunc ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* tiny test for inode number */ ++/* tmpfs generation is too rough */ ++static inline int au_test_higen(struct inode *inode, struct inode *h_inode) ++{ ++ //IiMustAnyLock(inode); ++ return !(itoii(inode)->ii_hsb1 == h_inode->i_sb ++ && inode->i_generation == h_inode->i_generation); ++} ++ ++static inline int au_iigen(struct inode *inode) ++{ ++ return atomic_read(&itoii(inode)->ii_generation); ++} ++ ++#ifdef CONFIG_AUFS_HINOTIFY ++static inline void au_iigen_dec(struct inode *inode) ++{ ++ //Dbg("i%lu\n", inode->i_ino); ++ atomic_dec(&itoii(inode)->ii_generation); ++} ++ ++/* hinotify.c */ ++int alloc_hinotify(struct aufs_hinode *hinode, struct inode *inode, ++ struct inode *h_inode); ++void do_free_hinotify(struct aufs_hinode *hinode); ++void do_hdir_lock(struct inode *h_dir, struct inode *dir, aufs_bindex_t bindex, ++ unsigned int lsc); ++void hdir_unlock(struct inode *h_dir, struct inode *dir, aufs_bindex_t bindex); ++void hdir_lock_rename(struct dentry **h_parents, struct inode **dirs, ++ aufs_bindex_t bindex, int issamedir); ++void hdir_unlock_rename(struct dentry **h_parents, struct inode **dirs, ++ aufs_bindex_t bindex, int issamedir); ++void au_reset_hinotify(struct inode *inode, unsigned int flags); ++int __init au_inotify_init(void); ++void au_inotify_fin(void); ++#else ++static inline ++int alloc_hinotify(struct aufs_hinode *hinode, struct inode *inode, ++ struct inode *h_inode) ++{ ++ return -EOPNOTSUPP; ++} ++ ++static inline void do_free_hinotify(struct aufs_hinode *hinode) ++{ ++ /* nothing */ ++} ++ ++static inline ++void do_hdir_lock(struct inode *h_dir, struct inode *dir, aufs_bindex_t bindex, ++ unsigned int lsc) ++{ ++ hi_lock(h_dir, lsc); ++} ++ ++static inline ++void hdir_unlock(struct inode *h_dir, struct inode *dir, aufs_bindex_t bindex) ++{ ++ i_unlock(h_dir); ++} ++ ++static inline ++void hdir_lock_rename(struct dentry **h_parents, struct inode **dirs, ++ aufs_bindex_t bindex, int issamedir) ++{ ++ vfsub_lock_rename(h_parents[0], h_parents[1]); ++} ++ ++static inline ++void hdir_unlock_rename(struct dentry **h_parents, struct inode **dirs, ++ aufs_bindex_t bindex, int issamedir) ++{ ++ vfsub_unlock_rename(h_parents[0], h_parents[1]); ++} ++ ++static inline void au_reset_hinotify(struct inode *inode, unsigned int flags) ++{ ++ /* nothing */ ++} ++ ++#define au_inotify_init() 0 ++#define au_inotify_fin() /* */ ++#endif /* CONFIG_AUFS_HINOTIFY */ ++ ++static inline void free_hinotify(struct inode *inode, aufs_bindex_t bindex) ++{ ++ do_free_hinotify(itoii(inode)->ii_hinode + bindex); ++} ++ ++/* ++ * hgdir_lock, hdir_lock, hdir2_lock ++ */ ++#define LockFunc(name, lsc) \ ++static inline \ ++void name##_lock(struct inode *h_dir, struct inode *dir, aufs_bindex_t bindex) \ ++{do_hdir_lock(h_dir, dir, bindex, AuLsc_HI_##lsc);} ++ ++LockFunc(hgdir, GPARENT); ++LockFunc(hdir, PARENT); ++LockFunc(hdir2, PARENT2); ++ ++#undef LockFunc ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* lock subclass for iinfo */ ++enum { ++ AuLsc_II_CHILD, /* child first */ ++ AuLsc_II_CHILD2, /* rename(2), link(2), and cpup at hinotify */ ++ AuLsc_II_CHILD3, /* copyup dirs */ ++ AuLsc_II_PARENT, ++ AuLsc_II_PARENT2, ++ AuLsc_II_PARENT3, ++ AuLsc_II_NEW /* new inode */ ++}; ++ ++/* ++ * ii_read_lock_child, ii_write_lock_child, ++ * ii_read_lock_child2, ii_write_lock_child2, ++ * ii_read_lock_child3, ii_write_lock_child3, ++ * ii_read_lock_parent, ii_write_lock_parent, ++ * ii_read_lock_parent2, ii_write_lock_parent2, ++ * ii_read_lock_parent3, ii_write_lock_parent3, ++ * ii_read_lock_new, ii_write_lock_new ++ */ ++#define ReadLockFunc(name, lsc) \ ++static inline void ii_read_lock_##name(struct inode *i) \ ++{rw_read_lock_nested(&itoii(i)->ii_rwsem, AuLsc_II_##lsc);} ++ ++#define WriteLockFunc(name, lsc) \ ++static inline void ii_write_lock_##name(struct inode *i) \ ++{rw_write_lock_nested(&itoii(i)->ii_rwsem, AuLsc_II_##lsc);} ++ ++#define RWLockFuncs(name, lsc) \ ++ ReadLockFunc(name, lsc); \ ++ WriteLockFunc(name, lsc) ++ ++RWLockFuncs(child, CHILD); ++RWLockFuncs(child2, CHILD2); ++RWLockFuncs(child3, CHILD3); ++RWLockFuncs(parent, PARENT); ++RWLockFuncs(parent2, PARENT2); ++RWLockFuncs(parent3, PARENT3); ++RWLockFuncs(new, NEW); ++ ++#undef ReadLockFunc ++#undef WriteLockFunc ++#undef RWLockFunc ++ ++/* ++ * ii_read_unlock, ii_write_unlock, ii_downgrade_lock ++ */ ++SimpleUnlockRwsemFuncs(ii, struct inode *i, itoii(i)->ii_rwsem); ++ ++/* to debug easier, do not make them inlined functions */ ++#define IiMustReadLock(i) do { \ ++ SiMustAnyLock((i)->i_sb); \ ++ RwMustReadLock(&itoii(i)->ii_rwsem); \ ++} while (0) ++ ++#define IiMustWriteLock(i) do { \ ++ SiMustAnyLock((i)->i_sb); \ ++ RwMustWriteLock(&itoii(i)->ii_rwsem); \ ++} while (0) ++ ++#define IiMustAnyLock(i) do { \ ++ SiMustAnyLock((i)->i_sb); \ ++ RwMustAnyLock(&itoii(i)->ii_rwsem); \ ++} while (0) ++ ++#define IiMustNoWaiters(i) RwMustNoWaiters(&itoii(i)->ii_rwsem) ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_INODE_H__ */ +diff --git a/fs/aufs/misc.c b/fs/aufs/misc.c +new file mode 100755 +index 0000000..32e0549 +--- /dev/null ++++ b/fs/aufs/misc.c +@@ -0,0 +1,228 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: misc.c,v 1.31 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++//#include <linux/fs.h> ++//#include <linux/namei.h> ++//#include <linux/mm.h> ++//#include <asm/uaccess.h> ++#include "aufs.h" ++ ++void *au_kzrealloc(void *p, unsigned int nused, unsigned int new_sz, gfp_t gfp) ++{ ++ void *q; ++ ++ LKTRTrace("p %p, nused %d, sz %d, ksize %d\n", ++ p, nused, new_sz, ksize(p)); ++ DEBUG_ON(new_sz <= 0); ++ if (new_sz <= nused) ++ return p; ++ if (new_sz <= ksize(p)) { ++ memset(p + nused, 0, new_sz - nused); ++ return p; ++ } ++ ++ q = kmalloc(new_sz, gfp); ++ //q = NULL; ++ if (unlikely(!q)) ++ return NULL; ++ memcpy(q, p, nused); ++ memset(q + nused, 0, new_sz - nused); ++ //smp_mb(); ++ kfree(p); ++ return q; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++// todo: make it inline ++struct nameidata *fake_dm(struct nameidata *fake_nd, struct nameidata *nd, ++ struct super_block *sb, aufs_bindex_t bindex) ++{ ++ LKTRTrace("nd %p, b%d\n", nd, bindex); ++ ++ if (!nd) ++ return NULL; ++ ++ fake_nd->dentry = NULL; ++ fake_nd->mnt = NULL; ++ ++#ifndef CONFIG_AUFS_FAKE_DM ++ DiMustAnyLock(nd->dentry); ++ ++ if (bindex <= dbend(nd->dentry)) ++ fake_nd->dentry = au_h_dptr_i(nd->dentry, bindex); ++ if (fake_nd->dentry) { ++ dget(fake_nd->dentry); ++ fake_nd->mnt = sbr_mnt(sb, bindex); ++ DEBUG_ON(!fake_nd->mnt); ++ mntget(fake_nd->mnt); ++ } else ++ fake_nd = ERR_PTR(-ENOENT); ++#endif ++ ++ TraceErrPtr(fake_nd); ++ return fake_nd; ++} ++ ++void fake_dm_release(struct nameidata *fake_nd) ++{ ++#ifndef CONFIG_AUFS_FAKE_DM ++ if (fake_nd) { ++ mntput(fake_nd->mnt); ++ dput(fake_nd->dentry); ++ } ++#endif ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++int au_copy_file(struct file *dst, struct file *src, loff_t len, ++ struct super_block *sb, int *sparse) ++{ ++ int err, all_zero, dlgt; ++ unsigned long blksize; ++ char *buf; ++ /* reduce stack space */ ++ struct iattr *ia; ++ ++ LKTRTrace("%.*s, %.*s\n", ++ DLNPair(dst->f_dentry), DLNPair(src->f_dentry)); ++ DEBUG_ON(!(dst->f_mode & FMODE_WRITE)); ++ IMustLock(dst->f_dentry->d_parent->d_inode); ++ ++ err = -ENOMEM; ++ blksize = dst->f_dentry->d_sb->s_blocksize; ++ if (!blksize || PAGE_SIZE < blksize) ++ blksize = PAGE_SIZE; ++ LKTRTrace("blksize %lu\n", blksize); ++ buf = kmalloc(blksize, GFP_KERNEL); ++ //buf = NULL; ++ if (unlikely(!buf)) ++ goto out; ++ ia = kmalloc(sizeof(*ia), GFP_KERNEL); ++ if (unlikely(!ia)) ++ goto out_buf; ++ ++ dlgt = need_dlgt(sb); ++ err = all_zero = 0; ++ dst->f_pos = src->f_pos = 0; ++ while (len) { ++ size_t sz, rbytes, wbytes, i; ++ char *p; ++ ++ LKTRTrace("len %lld\n", len); ++ sz = blksize; ++ if (len < blksize) ++ sz = len; ++ ++ /* support LSM and notify */ ++ rbytes = 0; ++ while (!rbytes || err == -EAGAIN || err == -EINTR) ++ err = rbytes = vfsub_read_k(src, buf, sz, &src->f_pos, ++ dlgt); ++ if (unlikely(err < 0)) ++ break; ++ ++ all_zero = 0; ++ if (len >= rbytes && rbytes == blksize) { ++ all_zero = 1; ++ p = buf; ++ for (i = 0; all_zero && i < rbytes; i++) ++ all_zero = !*p++; ++ } ++ if (!all_zero) { ++ wbytes = rbytes; ++ p = buf; ++ while (wbytes) { ++ size_t b; ++ /* support LSM and notify */ ++ err = b = vfsub_write_k(dst, p, wbytes, ++ &dst->f_pos, dlgt); ++ if (unlikely(err == -EAGAIN || err == -EINTR)) ++ continue; ++ if (unlikely(err < 0)) ++ break; ++ wbytes -= b; ++ p += b; ++ } ++ } else { ++ loff_t res; ++ LKTRLabel(hole); ++ *sparse = 1; ++ err = res = vfsub_llseek(dst, rbytes, SEEK_CUR); ++ if (unlikely(res < 0)) ++ break; ++ } ++ len -= rbytes; ++ err = 0; ++ } ++ ++ /* the last block may be a hole */ ++ if (unlikely(!err && all_zero)) { ++ struct dentry *h_d = dst->f_dentry; ++ struct inode *h_i = h_d->d_inode; ++ ++ LKTRLabel(last hole); ++ do { ++ err = vfsub_write_k(dst, "\0", 1, &dst->f_pos, dlgt); ++ } while (err == -EAGAIN || err == -EINTR); ++ if (err == 1) { ++ ia->ia_size = dst->f_pos; ++ ia->ia_valid = ATTR_SIZE | ATTR_FILE; ++ ia->ia_file = dst; ++ hi_lock_child2(h_i); ++ err = vfsub_notify_change(h_d, ia, dlgt); ++ i_unlock(h_i); ++ } ++ } ++ ++ kfree(ia); ++ out_buf: ++ kfree(buf); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++int test_ro(struct super_block *sb, aufs_bindex_t bindex, struct inode *inode) ++{ ++ int err; ++ ++ err = br_rdonly(stobr(sb, bindex)); ++ if (!err && inode) { ++ struct inode *hi = au_h_iptr_i(inode, bindex); ++ if (hi) ++ err = IS_IMMUTABLE(hi) ? -EROFS : 0; ++ } ++ return err; ++} ++ ++int au_test_perm(struct inode *hidden_inode, int mask, int dlgt) ++{ ++ if (!current->fsuid) ++ return 0; ++ if (unlikely(au_is_nfs(hidden_inode->i_sb) ++ && (mask & MAY_WRITE) ++ && S_ISDIR(hidden_inode->i_mode))) ++ mask |= MAY_READ; /* force permission check */ ++ return vfsub_permission(hidden_inode, mask, NULL, dlgt); ++} +diff --git a/fs/aufs/misc.h b/fs/aufs/misc.h +new file mode 100755 +index 0000000..fea4a2c +--- /dev/null ++++ b/fs/aufs/misc.h +@@ -0,0 +1,187 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: misc.h,v 1.25 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_MISC_H__ ++#define __AUFS_MISC_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/namei.h> ++#include <linux/sched.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++ ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,18) ++#define I_MUTEX_QUOTA 0 ++#define lockdep_off() /* */ ++#define lockdep_on() /* */ ++#define mutex_lock_nested(mtx, lsc) mutex_lock(mtx) ++#define down_write_nested(rw, lsc) down_write(rw) ++#define down_read_nested(rw, lsc) down_read(rw) ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct aufs_rwsem { ++ struct rw_semaphore rwsem; ++#ifdef CONFIG_AUFS_DEBUG ++ atomic_t rcnt; ++#endif ++}; ++ ++#ifdef CONFIG_AUFS_DEBUG ++#define DbgRcntInit(rw) atomic_set(&(rw)->rcnt, 0) ++#define DbgRcntInc(rw) atomic_inc(&(rw)->rcnt) ++#define DbgRcntDec(rw) WARN_ON(atomic_dec_return(&(rw)->rcnt) < 0) ++#else ++#define DbgRcntInit(rw) /* */ ++#define DbgRcntInc(rw) /* */ ++#define DbgRcntDec(rw) /* */ ++#endif ++ ++static inline void rw_init_nolock(struct aufs_rwsem *rw) ++{ ++ DbgRcntInit(rw); ++ init_rwsem(&rw->rwsem); ++} ++ ++static inline void rw_init_wlock(struct aufs_rwsem *rw) ++{ ++ rw_init_nolock(rw); ++ down_write(&rw->rwsem); ++} ++ ++static inline void rw_init_wlock_nested(struct aufs_rwsem *rw, unsigned int lsc) ++{ ++ rw_init_nolock(rw); ++ down_write_nested(&rw->rwsem, lsc); ++} ++ ++static inline void rw_read_lock(struct aufs_rwsem *rw) ++{ ++ down_read(&rw->rwsem); ++ DbgRcntInc(rw); ++} ++ ++static inline void rw_read_lock_nested(struct aufs_rwsem *rw, unsigned int lsc) ++{ ++ down_read_nested(&rw->rwsem, lsc); ++ DbgRcntInc(rw); ++} ++ ++static inline void rw_read_unlock(struct aufs_rwsem *rw) ++{ ++ DbgRcntDec(rw); ++ up_read(&rw->rwsem); ++} ++ ++static inline void rw_dgrade_lock(struct aufs_rwsem *rw) ++{ ++ DbgRcntInc(rw); ++ downgrade_write(&rw->rwsem); ++} ++ ++static inline void rw_write_lock(struct aufs_rwsem *rw) ++{ ++ down_write(&rw->rwsem); ++} ++ ++static inline void rw_write_lock_nested(struct aufs_rwsem *rw, unsigned int lsc) ++{ ++ down_write_nested(&rw->rwsem, lsc); ++} ++ ++static inline void rw_write_unlock(struct aufs_rwsem *rw) ++{ ++ up_write(&rw->rwsem); ++} ++ ++#if 0 // why is not _nested version defined ++static inline int rw_read_trylock(struct aufs_rwsem *rw) ++{ ++ int ret = down_read_trylock(&rw->rwsem); ++ if (ret) ++ DbgRcntInc(rw); ++ return ret; ++} ++ ++static inline int rw_write_trylock(struct aufs_rwsem *rw) ++{ ++ return down_write_trylock(&rw->rwsem); ++} ++#endif ++ ++#undef DbgRcntInit ++#undef DbgRcntInc ++#undef DbgRcntDec ++ ++/* to debug easier, do not make them inlined functions */ ++#define RwMustNoWaiters(rw) DEBUG_ON(!list_empty(&(rw)->rwsem.wait_list)) ++#define RwMustAnyLock(rw) DEBUG_ON(down_write_trylock(&(rw)->rwsem)) ++#ifdef CONFIG_AUFS_DEBUG ++#define RwMustReadLock(rw) do { \ ++ RwMustAnyLock(rw); \ ++ DEBUG_ON(!atomic_read(&(rw)->rcnt)); \ ++} while (0) ++#define RwMustWriteLock(rw) do { \ ++ RwMustAnyLock(rw); \ ++ DEBUG_ON(atomic_read(&(rw)->rcnt)); \ ++} while (0) ++#else ++#define RwMustReadLock(rw) RwMustAnyLock(rw) ++#define RwMustWriteLock(rw) RwMustAnyLock(rw) ++#endif ++ ++#define SimpleLockRwsemFuncs(prefix, param, rwsem) \ ++static inline void prefix##_read_lock(param) {rw_read_lock(&(rwsem));} \ ++static inline void prefix##_write_lock(param) {rw_write_lock(&(rwsem));} ++//static inline void prefix##_read_trylock(param) {rw_read_trylock(&(rwsem));} ++//static inline void prefix##_write_trylock(param) {rw_write_trylock(&(rwsem));} ++//static inline void prefix##_read_trylock_nested(param, lsc) ++//{rw_read_trylock_nested(&(rwsem, lsc));} ++//static inline void prefix##_write_trylock_nestd(param, lsc) ++//{rw_write_trylock_nested(&(rwsem), nested);} ++ ++#define SimpleUnlockRwsemFuncs(prefix, param, rwsem) \ ++static inline void prefix##_read_unlock(param) {rw_read_unlock(&(rwsem));} \ ++static inline void prefix##_write_unlock(param) {rw_write_unlock(&(rwsem));} \ ++static inline void prefix##_downgrade_lock(param) {rw_dgrade_lock(&(rwsem));} ++ ++#define SimpleRwsemFuncs(prefix, param, rwsem) \ ++ SimpleLockRwsemFuncs(prefix, param, rwsem); \ ++ SimpleUnlockRwsemFuncs(prefix, param, rwsem) ++ ++/* ---------------------------------------------------------------------- */ ++ ++typedef ssize_t (*readf_t)(struct file*, char __user*, size_t, loff_t*); ++typedef ssize_t (*writef_t)(struct file*, const char __user*, size_t, loff_t*); ++ ++void *au_kzrealloc(void *p, unsigned int nused, unsigned int new_sz, gfp_t gfp); ++struct nameidata *fake_dm(struct nameidata *fake_nd, struct nameidata *nd, ++ struct super_block *sb, aufs_bindex_t bindex); ++void fake_dm_release(struct nameidata *fake_nd); ++int au_copy_file(struct file *dst, struct file *src, loff_t len, ++ struct super_block *sb, int *sparse); ++int test_ro(struct super_block *sb, aufs_bindex_t bindex, struct inode *inode); ++int au_test_perm(struct inode *h_inode, int mask, int dlgt); ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_MISC_H__ */ +diff --git a/fs/aufs/module.c b/fs/aufs/module.c +new file mode 100755 +index 0000000..06c563e +--- /dev/null ++++ b/fs/aufs/module.c +@@ -0,0 +1,334 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: module.c,v 1.9 2007/04/30 05:46:32 sfjro Exp $ */ ++ ++//#include <linux/init.h> ++//#include <linux/kobject.h> ++#include <linux/module.h> ++//#include <linux/seq_file.h> ++//#include <linux/sysfs.h> ++#include "aufs.h" ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * aufs caches ++ */ ++struct kmem_cache *aufs_cachep[AuCache_Last]; ++static int __init create_cache(void) ++{ ++#define Cache(type) kmem_cache_create(#type, sizeof(struct type), 0, \ ++ SLAB_RECLAIM_ACCOUNT, NULL, NULL) ++ ++ if ((aufs_cachep[AuCache_DINFO] = Cache(aufs_dinfo)) ++ && (aufs_cachep[AuCache_ICNTNR] = Cache(aufs_icntnr)) ++ && (aufs_cachep[AuCache_FINFO] = Cache(aufs_finfo)) ++ //&& (aufs_cachep[AuCache_FINFO] = NULL) ++ && (aufs_cachep[AuCache_VDIR] = Cache(aufs_vdir)) ++ && (aufs_cachep[AuCache_DEHSTR] = Cache(aufs_dehstr)) ++ && (aufs_cachep[AuCache_HINOTIFY] = Cache(aufs_hinotify))) ++ return 0; ++ return -ENOMEM; ++ ++#undef Cache ++} ++ ++static void destroy_cache(void) ++{ ++ int i; ++ for (i = 0; i < AuCache_Last; i++) ++ if (aufs_cachep[i]) ++ kmem_cache_destroy(aufs_cachep[i]); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++char au_esc_chars[0x20 + 3]; /* 0x01-0x20, backslash, del, and NULL */ ++int au_dir_roflags; ++extern struct file_system_type aufs_fs_type; ++ ++#ifdef DbgDlgt ++#include <linux/security.h> ++#include "dbg_dlgt.c" ++#else ++#define dbg_dlgt_init() 0 ++#define dbg_dlgt_fin() /* */ ++#endif ++ ++/* ++ * functions for module interface. ++ */ ++MODULE_LICENSE("GPL"); ++MODULE_AUTHOR("Junjiro Okajima"); ++MODULE_DESCRIPTION(AUFS_NAME " -- Another unionfs"); ++MODULE_VERSION(AUFS_VERSION); ++ ++/* it should be 'byte', but param_set_byte() prints by "%c" */ ++short aufs_nwkq = AUFS_NWKQ_DEF; ++MODULE_PARM_DESC(nwkq, "the number of workqueue thread, " AUFS_WKQ_NAME); ++module_param_named(nwkq, aufs_nwkq, short, 0444); ++ ++int sysaufs_brs = 0; ++MODULE_PARM_DESC(brs, "use <sysfs>/fs/aufs/brs"); ++module_param_named(brs, sysaufs_brs, int, 0444); ++ ++static int __init aufs_init(void) ++{ ++ int err, i; ++ char *p; ++ ++ //sbinfo->si_xino is atomic_long_t ++ BUILD_BUG_ON(sizeof(ino_t) != sizeof(long)); ++ ++#ifdef CONFIG_AUFS_DEBUG ++ { ++ struct aufs_destr destr; ++ destr.len = -1; ++ DEBUG_ON(destr.len < NAME_MAX); ++ } ++ ++#ifdef CONFIG_4KSTACKS ++ printk("CONFIG_4KSTACKS is defined.\n"); ++#endif ++#if 0 // verbose debug ++ { ++ union { ++ struct aufs_branch *br; ++ struct aufs_dinfo *di; ++ struct aufs_finfo *fi; ++ struct aufs_iinfo *ii; ++ struct aufs_hinode *hi; ++ struct aufs_sbinfo *si; ++ struct aufs_destr *destr; ++ struct aufs_de *de; ++ struct aufs_wh *wh; ++ struct aufs_vdir *vd; ++ } u; ++ ++ printk("br{" ++ "xino %d, readf %d, writef %d, " ++ "id %d, perm %d, mnt %d, count %d, " ++ "wh_sem %d, wh %d, run %d} %d\n", ++ offsetof(typeof(*u.br), br_xino), ++ offsetof(typeof(*u.br), br_xino_read), ++ offsetof(typeof(*u.br), br_xino_write), ++ offsetof(typeof(*u.br), br_id), ++ offsetof(typeof(*u.br), br_perm), ++ offsetof(typeof(*u.br), br_mnt), ++ offsetof(typeof(*u.br), br_count), ++ offsetof(typeof(*u.br), br_wh_rwsem), ++ offsetof(typeof(*u.br), br_wh), ++ offsetof(typeof(*u.br), br_wh_running), ++ sizeof(*u.br)); ++ printk("di{gen %d, rwsem %d, bstart %d, bend %d, bwh %d, " ++ "bdiropq %d, hdentry %d, reval %d} %d\n", ++ offsetof(typeof(*u.di), di_generation), ++ offsetof(typeof(*u.di), di_rwsem), ++ offsetof(typeof(*u.di), di_bstart), ++ offsetof(typeof(*u.di), di_bend), ++ offsetof(typeof(*u.di), di_bwh), ++ offsetof(typeof(*u.di), di_bdiropq), ++ offsetof(typeof(*u.di), di_hdentry), ++ offsetof(typeof(*u.di), di_reval), ++ sizeof(*u.di)); ++ printk("fi{gen %d, rwsem %d, hfile %d, bstart %d, bend %d, " ++ "h_vm_ops %d, vdir_cach %d} %d\n", ++ offsetof(typeof(*u.fi), fi_generation), ++ offsetof(typeof(*u.fi), fi_rwsem), ++ offsetof(typeof(*u.fi), fi_hfile), ++ offsetof(typeof(*u.fi), fi_bstart), ++ offsetof(typeof(*u.fi), fi_bend), ++ offsetof(typeof(*u.fi), fi_h_vm_ops), ++ offsetof(typeof(*u.fi), fi_vdir_cache), ++ sizeof(*u.fi)); ++ printk("ii{rwsem %d, bstart %d, bend %d, hinode %d, vdir %d} " ++ "%d\n", ++ offsetof(typeof(*u.ii), ii_rwsem), ++ offsetof(typeof(*u.ii), ii_bstart), ++ offsetof(typeof(*u.ii), ii_bend), ++ offsetof(typeof(*u.ii), ii_hinode), ++ offsetof(typeof(*u.ii), ii_vdir), ++ sizeof(*u.ii)); ++ printk("hi{inode %d, id %d, notify %d} %d\n", ++ offsetof(typeof(*u.hi), hi_inode), ++ offsetof(typeof(*u.hi), hi_id), ++ offsetof(typeof(*u.hi), hi_notify), ++ sizeof(*u.hi)); ++ printk("si{rwsem %d, gen %d, " ++ "failed_refresh %d, " ++ "bend %d, last id %d, br %d, " ++ "flags %d, " ++ "xino %d, " ++ "rdcache %d, " ++ "dirwh %d, " ++ "pl_lock %d, pl %d, " ++ "kobj %d} %d\n", ++ offsetof(typeof(*u.si), si_rwsem), ++ offsetof(typeof(*u.si), si_generation), ++ -1,//offsetof(typeof(*u.si), si_failed_refresh_dirs), ++ offsetof(typeof(*u.si), si_bend), ++ offsetof(typeof(*u.si), si_last_br_id), ++ offsetof(typeof(*u.si), si_branch), ++ offsetof(typeof(*u.si), si_flags), ++ offsetof(typeof(*u.si), si_xino), ++ offsetof(typeof(*u.si), si_rdcache), ++ offsetof(typeof(*u.si), si_dirwh), ++ offsetof(typeof(*u.si), si_plink_lock), ++ offsetof(typeof(*u.si), si_plink), ++ offsetof(typeof(*u.si), si_kobj), ++ sizeof(*u.si)); ++ printk("destr{len %d, name %d} %d\n", ++ offsetof(typeof(*u.destr), len), ++ offsetof(typeof(*u.destr), name), ++ sizeof(*u.destr)); ++ printk("de{ino %d, type %d, str %d} %d\n", ++ offsetof(typeof(*u.de), de_ino), ++ offsetof(typeof(*u.de), de_type), ++ offsetof(typeof(*u.de), de_str), ++ sizeof(*u.de)); ++ printk("wh{hash %d, bindex %d, str %d} %d\n", ++ offsetof(typeof(*u.wh), wh_hash), ++ offsetof(typeof(*u.wh), wh_bindex), ++ offsetof(typeof(*u.wh), wh_str), ++ sizeof(*u.wh)); ++ printk("vd{deblk %d, nblk %d, last %d, ver %d, jiffy %d} %d\n", ++ offsetof(typeof(*u.vd), vd_deblk), ++ offsetof(typeof(*u.vd), vd_nblk), ++ offsetof(typeof(*u.vd), vd_last), ++ offsetof(typeof(*u.vd), vd_version), ++ offsetof(typeof(*u.vd), vd_jiffy), ++ sizeof(*u.vd)); ++ } ++#endif ++#endif ++ ++ p = au_esc_chars; ++ for (i = 1; i <= ' '; i++) ++ *p++ = i; ++ *p++ = '\\'; ++ *p++ = '\x7f'; ++ *p = 0; ++ ++ au_dir_roflags = au_file_roflags(O_DIRECTORY | O_LARGEFILE); ++#ifndef CONFIG_AUFS_SYSAUFS ++ sysaufs_brs = 0; ++#endif ++ ++ err = -EINVAL; ++ if (unlikely(aufs_nwkq <= 0)) ++ goto out; ++ err = create_cache(); ++ if (unlikely(err)) ++ goto out; ++ err = sysaufs_init(); ++ if (unlikely(err)) ++ goto out_cache; ++ err = au_wkq_init(); ++ if (unlikely(err)) ++ goto out_kobj; ++ err = au_inotify_init(); ++ if (unlikely(err)) ++ goto out_wkq; ++ err = dbg_dlgt_init(); ++ if (unlikely(err)) ++ goto out_inotify; ++ err = register_filesystem(&aufs_fs_type); ++ if (unlikely(err)) ++ goto out_dlgt; ++ printk(AUFS_NAME " " AUFS_VERSION "\n"); ++ return 0; /* success */ ++ ++ out_dlgt: ++ dbg_dlgt_fin(); ++ out_inotify: ++ au_inotify_fin(); ++ out_wkq: ++ au_wkq_fin(); ++ out_kobj: ++ sysaufs_fin(); ++ out_cache: ++ destroy_cache(); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static void __exit aufs_exit(void) ++{ ++ unregister_filesystem(&aufs_fs_type); ++ dbg_dlgt_fin(); ++ au_inotify_fin(); ++ au_wkq_fin(); ++ sysaufs_fin(); ++ destroy_cache(); ++} ++ ++module_init(aufs_init); ++module_exit(aufs_exit); ++ ++/* ---------------------------------------------------------------------- */ ++ ++// fake Kconfig ++#if 1 ++#ifdef CONFIG_AUFS_HINOTIFY ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,18) ++#error CONFIG_AUFS_HINOTIFY is supported in linux-2.6.18 and later. ++#endif ++#ifndef CONFIG_INOTIFY ++#error enable CONFIG_INOTIFY to use CONFIG_AUFS_HINOTIFY. ++#endif ++#endif ++ ++#if AUFS_BRANCH_MAX > 511 && BITS_PER_LONG == 64 && PAGE_SIZE == 4096 ++#warning For 4k pagesize and 64bit environment, \ ++ CONFIG_AUFS_BRANCH_MAX_511 or smaller is recommended. ++#endif ++ ++#ifdef CONFIG_AUFS_SYSAUFS ++#ifndef CONFIG_SYSFS ++#error CONFIG_AUFS_SYSAUFS requires CONFIG_SYSFS. ++#endif ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,18) ++#error CONFIG_AUFS_SYSAUFS requires linux-2.6.18 and later. ++#endif ++#endif ++ ++#ifdef CONFIG_AUFS_EXPORT ++#if !defined(CONFIG_EXPORTFS) && !defined(CONFIG_EXPORTFS_MODULE) ++#error CONFIG_AUFS_EXPORT requires CONFIG_EXPORTFS ++#endif ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,18) ++#error CONFIG_AUFS_EXPORT requires linux-2.6.18 and later. ++#endif ++#if defined(CONFIG_EXPORTFS_MODULE) && defined(CONFIG_AUFS) ++#error need CONFIG_EXPORTFS=y to link aufs statically with CONFIG_AUFS_EXPORT ++#endif ++#endif ++ ++#ifdef CONFIG_DEBUG_PROVE_LOCKING ++#if MAX_LOCKDEP_SUBCLASSES < AuLsc_End ++#warning lockdep will not work since aufs uses deeper locks. ++#endif ++#endif ++ ++#ifdef CONFIG_AUFS_COMPAT ++#warning CONFIG_AUFS_COMPAT will be removed in the near future. ++#endif ++ ++#endif +diff --git a/fs/aufs/module.h b/fs/aufs/module.h +new file mode 100755 +index 0000000..3769861 +--- /dev/null ++++ b/fs/aufs/module.h +@@ -0,0 +1,60 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: module.h,v 1.8 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_MODULE_H__ ++#define __AUFS_MODULE_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/slab.h> ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* module parameters */ ++extern short aufs_nwkq; ++extern int sysaufs_brs; ++ ++/* ---------------------------------------------------------------------- */ ++ ++extern char au_esc_chars[]; ++extern int au_dir_roflags; ++ ++/* kmem cache */ ++enum {AuCache_DINFO, AuCache_ICNTNR, AuCache_FINFO, AuCache_VDIR, ++ AuCache_DEHSTR, AuCache_HINOTIFY, AuCache_Last}; ++extern struct kmem_cache *aufs_cachep[]; ++ ++#define CacheFuncs(name, index) \ ++static inline void *cache_alloc_##name(void) \ ++{return kmem_cache_alloc(aufs_cachep[index], GFP_KERNEL);} \ ++static inline void cache_free_##name(void *p) \ ++{kmem_cache_free(aufs_cachep[index], p);} ++ ++CacheFuncs(dinfo, AuCache_DINFO); ++CacheFuncs(icntnr, AuCache_ICNTNR); ++CacheFuncs(finfo, AuCache_FINFO); ++CacheFuncs(vdir, AuCache_VDIR); ++CacheFuncs(dehstr, AuCache_DEHSTR); ++CacheFuncs(hinotify, AuCache_HINOTIFY); ++ ++#undef CacheFuncs ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_MODULE_H__ */ +diff --git a/fs/aufs/opts.c b/fs/aufs/opts.c +new file mode 100755 +index 0000000..c1a9445 +--- /dev/null ++++ b/fs/aufs/opts.c +@@ -0,0 +1,1043 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: opts.c,v 1.34 2007/05/14 03:40:27 sfjro Exp $ */ ++ ++#include <asm/types.h> // a distribution requires ++#include <linux/parser.h> ++#include "aufs.h" ++ ++enum { ++ Opt_br, ++ Opt_add, Opt_del, Opt_mod, Opt_append, Opt_prepend, ++ Opt_idel, Opt_imod, ++ Opt_dirwh, Opt_rdcache, Opt_deblk, Opt_nhash, ++ Opt_xino, Opt_zxino, Opt_noxino, ++ Opt_plink, Opt_noplink, Opt_list_plink, Opt_clean_plink, ++ Opt_udba, ++ Opt_diropq_a, Opt_diropq_w, ++ Opt_warn_perm, Opt_nowarn_perm, ++ Opt_findrw_dir, Opt_findrw_br, ++ Opt_coo, ++ Opt_dlgt, Opt_nodlgt, ++ Opt_tail, Opt_ignore, Opt_err ++}; ++ ++static match_table_t options = { ++ {Opt_br, "br=%s"}, ++ {Opt_br, "br:%s"}, ++ ++ {Opt_add, "add=%d:%s"}, ++ {Opt_add, "add:%d:%s"}, ++ {Opt_add, "ins=%d:%s"}, ++ {Opt_add, "ins:%d:%s"}, ++ {Opt_append, "append=%s"}, ++ {Opt_append, "append:%s"}, ++ {Opt_prepend, "prepend=%s"}, ++ {Opt_prepend, "prepend:%s"}, ++ ++ {Opt_del, "del=%s"}, ++ {Opt_del, "del:%s"}, ++ //{Opt_idel, "idel:%d"}, ++ {Opt_mod, "mod=%s"}, ++ {Opt_mod, "mod:%s"}, ++ //{Opt_imod, "imod:%d:%s"}, ++ ++ {Opt_dirwh, "dirwh=%d"}, ++ {Opt_dirwh, "dirwh:%d"}, ++ ++ {Opt_xino, "xino=%s"}, ++ {Opt_xino, "xino:%s"}, ++ {Opt_noxino, "noxino"}, ++ //{Opt_zxino, "zxino=%s"}, ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,16) ++ {Opt_plink, "plink"}, ++ {Opt_noplink, "noplink"}, ++#ifdef CONFIG_AUFS_DEBUG ++ {Opt_list_plink, "list_plink"}, ++#endif ++ {Opt_clean_plink, "clean_plink"}, ++#endif ++ ++ {Opt_udba, "udba=%s"}, ++ ++ {Opt_diropq_a, "diropq=always"}, ++ {Opt_diropq_a, "diropq=a"}, ++ {Opt_diropq_w, "diropq=whiteouted"}, ++ {Opt_diropq_w, "diropq=w"}, ++ ++ {Opt_warn_perm, "warn_perm"}, ++ {Opt_nowarn_perm, "nowarn_perm"}, ++ ++#ifdef CONFIG_AUFS_DLGT ++ {Opt_dlgt, "dlgt"}, ++ {Opt_nodlgt, "nodlgt"}, ++#endif ++ ++ {Opt_rdcache, "rdcache=%d"}, ++ {Opt_rdcache, "rdcache:%d"}, ++#if 0 ++ {Opt_findrw_dir, "findrw=dir"}, ++ {Opt_findrw_br, "findrw=br"}, ++ ++ {Opt_coo, "coo=%s"}, ++ ++ {Opt_deblk, "deblk=%d"}, ++ {Opt_deblk, "deblk:%d"}, ++ {Opt_nhash, "nhash=%d"}, ++ {Opt_nhash, "nhash:%d"}, ++#endif ++ ++ {Opt_br, "dirs=%s"}, ++ {Opt_ignore, "debug=%d"}, ++ {Opt_ignore, "delete=whiteout"}, ++ {Opt_ignore, "delete=all"}, ++ {Opt_ignore, "imap=%s"}, ++ ++ {Opt_err, NULL} ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++#define RW "rw" ++#define RO "ro" ++#define WH "wh" ++#define RR "rr" ++#define NoLinkWH "nolwh" ++ ++static match_table_t brperms = { ++ {AuBr_RR, RR}, ++ {AuBr_RO, RO}, ++ {AuBr_RW, RW}, ++ ++ {AuBr_RRWH, RR "+" WH}, ++ {AuBr_ROWH, RO "+" WH}, ++ {AuBr_RWNoLinkWH, RW "+" NoLinkWH}, ++ ++ {AuBr_ROWH, "nfsro"}, ++ {AuBr_RO, NULL} ++}; ++ ++static int br_perm_val(char *perm) ++{ ++ int val; ++ substring_t args[MAX_OPT_ARGS]; ++ ++ DEBUG_ON(!perm || !*perm); ++ LKTRTrace("perm %s\n", perm); ++ val = match_token(perm, brperms, args); ++ TraceErr(val); ++ return val; ++} ++ ++int br_perm_str(char *p, unsigned int len, int brperm) ++{ ++ struct match_token *bp = brperms; ++ ++ LKTRTrace("len %d, 0x%x\n", len, brperm); ++ ++ while (bp->pattern) { ++ if (bp->token == brperm) { ++ if (strlen(bp->pattern) < len) { ++ strcpy(p, bp->pattern); ++ return 0; ++ } else ++ return -E2BIG; ++ } ++ bp++; ++ } ++ ++ return -EIO; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static match_table_t udbalevel = { ++ {AuFlag_UDBA_REVAL, "reval"}, ++#ifdef CONFIG_AUFS_HINOTIFY ++ {AuFlag_UDBA_INOTIFY, "inotify"}, ++#endif ++ {AuFlag_UDBA_NONE, "none"}, ++ {-1, NULL} ++}; ++ ++static int udba_val(char *str) ++{ ++ substring_t args[MAX_OPT_ARGS]; ++ return match_token(str, udbalevel, args); ++} ++ ++au_parser_pattern_t udba_str(int udba) ++{ ++ struct match_token *p = udbalevel; ++ while (p->pattern) { ++ if (p->token == udba) ++ return p->pattern; ++ p++; ++ } ++ BUG(); ++ return "??"; ++} ++ ++void udba_set(struct super_block *sb, unsigned int flg) ++{ ++ au_flag_clr(sb, AuMask_UDBA); ++ au_flag_set(sb, flg); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static match_table_t coolevel = { ++ {AuFlag_COO_LEAF, "leaf"}, ++ {AuFlag_COO_ALL, "all"}, ++ {AuFlag_COO_NONE, "none"}, ++ {-1, NULL} ++}; ++ ++#if 0 ++static int coo_val(char *str) ++{ ++ substring_t args[MAX_OPT_ARGS]; ++ return match_token(str, coolevel, args); ++} ++#endif ++ ++au_parser_pattern_t coo_str(int coo) ++{ ++ struct match_token *p = coolevel; ++ while (p->pattern) { ++ if (p->token == coo) ++ return p->pattern; ++ p++; ++ } ++ BUG(); ++ return "??"; ++} ++static void coo_set(struct super_block *sb, unsigned int flg) ++{ ++ au_flag_clr(sb, AuMask_COO); ++ au_flag_set(sb, flg); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static const int lkup_dirflags = LOOKUP_FOLLOW | LOOKUP_DIRECTORY; ++ ++#ifdef CONFIG_AUFS_DEBUG ++static void dump_opts(struct opts *opts) ++{ ++ /* reduce stack space */ ++ union { ++ struct opt_add *add; ++ struct opt_del *del; ++ struct opt_mod *mod; ++ struct opt_xino *xino; ++ } u; ++ struct opt *opt; ++ ++ TraceEnter(); ++ ++ opt = opts->opt; ++ while (/* opt < opts_tail && */ opt->type != Opt_tail) { ++ switch (opt->type) { ++ case Opt_add: ++ u.add = &opt->add; ++ LKTRTrace("add {b%d, %s, 0x%x, %p}\n", ++ u.add->bindex, u.add->path, u.add->perm, ++ u.add->nd.dentry); ++ break; ++ case Opt_del: ++ case Opt_idel: ++ u.del = &opt->del; ++ LKTRTrace("del {%s, %p}\n", u.del->path, u.del->h_root); ++ break; ++ case Opt_mod: ++ case Opt_imod: ++ u.mod = &opt->mod; ++ LKTRTrace("mod {%s, 0x%x, %p}\n", ++ u.mod->path, u.mod->perm, u.mod->h_root); ++ break; ++ case Opt_append: ++ u.add = &opt->add; ++ LKTRTrace("append {b%d, %s, 0x%x, %p}\n", ++ u.add->bindex, u.add->path, u.add->perm, ++ u.add->nd.dentry); ++ break; ++ case Opt_prepend: ++ u.add = &opt->add; ++ LKTRTrace("prepend {b%d, %s, 0x%x, %p}\n", ++ u.add->bindex, u.add->path, u.add->perm, ++ u.add->nd.dentry); ++ break; ++ case Opt_dirwh: ++ LKTRTrace("dirwh %d\n", opt->dirwh); ++ break; ++ case Opt_rdcache: ++ LKTRTrace("rdcache %d\n", opt->rdcache); ++ break; ++ case Opt_xino: ++ u.xino = &opt->xino; ++ LKTRTrace("xino {%s %.*s}\n", ++ u.xino->path, DLNPair(u.xino->file->f_dentry)); ++ break; ++ case Opt_noxino: ++ LKTRLabel(noxino); ++ break; ++ case Opt_plink: ++ LKTRLabel(plink); ++ break; ++ case Opt_noplink: ++ LKTRLabel(noplink); ++ break; ++ case Opt_list_plink: ++ LKTRLabel(list_plink); ++ break; ++ case Opt_clean_plink: ++ LKTRLabel(clean_plink); ++ break; ++ case Opt_udba: ++ LKTRTrace("udba %d, %s\n", ++ opt->udba, udba_str(opt->udba)); ++ break; ++ case Opt_diropq_a: ++ LKTRLabel(diropq_a); ++ break; ++ case Opt_diropq_w: ++ LKTRLabel(diropq_w); ++ break; ++ case Opt_warn_perm: ++ LKTRLabel(warn_perm); ++ break; ++ case Opt_nowarn_perm: ++ LKTRLabel(nowarn_perm); ++ break; ++ case Opt_dlgt: ++ LKTRLabel(dlgt); ++ break; ++ case Opt_nodlgt: ++ LKTRLabel(nodlgt); ++ break; ++ case Opt_coo: ++ LKTRTrace("coo %d, %s\n", opt->coo, coo_str(opt->coo)); ++ break; ++ default: ++ BUG(); ++ } ++ opt++; ++ } ++} ++#else ++#define dump_opts(opts) /* */ ++#endif ++ ++void au_free_opts(struct opts *opts) ++{ ++ struct opt *opt; ++ ++ TraceEnter(); ++ ++ opt = opts->opt; ++ while (opt->type != Opt_tail) { ++ switch (opt->type) { ++ case Opt_add: ++ case Opt_append: ++ case Opt_prepend: ++ path_release(&opt->add.nd); ++ break; ++ case Opt_del: ++ case Opt_idel: ++ dput(opt->del.h_root); ++ break; ++ case Opt_mod: ++ case Opt_imod: ++ dput(opt->mod.h_root); ++ break; ++ case Opt_xino: ++ fput(opt->xino.file); ++ break; ++ } ++ opt++; ++ } ++} ++ ++static int opt_add(struct opt *opt, char *opt_str, struct super_block *sb, ++ aufs_bindex_t bindex) ++{ ++ int err; ++ struct opt_add *add = &opt->add; ++ char *p; ++ ++ LKTRTrace("%s, b%d\n", opt_str, bindex); ++ ++ add->bindex = bindex; ++ add->perm = AuBr_RO; ++ if (!bindex && !(sb->s_flags & MS_RDONLY)) ++ add->perm = AuBr_RW; ++#ifdef CONFIG_AUFS_COMPAT ++ add->perm = AuBr_RW; ++#endif ++ add->path = opt_str; ++ p = strchr(opt_str, '='); ++ if (unlikely(p)) { ++ *p++ = 0; ++ if (*p) ++ add->perm = br_perm_val(p); ++ } ++ ++ // LSM may detect it ++ // do not superio. ++ err = path_lookup(add->path, lkup_dirflags, &add->nd); ++ //err = -1; ++ if (!err) { ++ opt->type = Opt_add; ++ goto out; ++ } ++ Err("lookup failed %s (%d)\n", add->path, err); ++ err = -EINVAL; ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* called without aufs lock */ ++int au_parse_opts(struct super_block *sb, char *str, struct opts *opts) ++{ ++ int err, n; ++ struct dentry *root; ++ struct opt *opt, *opt_tail; ++ char *opt_str; ++ substring_t args[MAX_OPT_ARGS]; ++ aufs_bindex_t bindex; ++ struct nameidata nd; ++ /* reduce stack space */ ++ union { ++ struct opt_del *del; ++ struct opt_mod *mod; ++ struct opt_xino *xino; ++ } u; ++ struct file *file; ++ ++ LKTRTrace("%s, nopts %d\n", str, opts->max_opt); ++ ++ root = sb->s_root; ++ err = 0; ++ bindex = 0; ++ opt = opts->opt; ++ opt_tail = opt + opts->max_opt - 1; ++ opt->type = Opt_tail; ++ while (!err && (opt_str = strsep(&str, ",")) && *opt_str) { ++ int token, skipped; ++ char *p; ++ err = -EINVAL; ++ token = match_token(opt_str, options, args); ++ LKTRTrace("%s, token %d, args[0]{%p, %p}\n", ++ opt_str, token, args[0].from, args[0].to); ++ ++ skipped = 0; ++ switch (token) { ++ case Opt_br: ++ err = 0; ++ while (!err && (opt_str = strsep(&args[0].from, ":")) ++ && *opt_str) { ++ err = opt_add(opt, opt_str, sb, bindex++); ++ //if (LktrCond) err = -1; ++ if (unlikely(!err && ++opt > opt_tail)) { ++ err = -E2BIG; ++ break; ++ } ++ opt->type = Opt_tail; ++ skipped = 1; ++ } ++ break; ++ case Opt_add: ++ if (unlikely(match_int(&args[0], &n))) { ++ Err("bad integer in %s\n", opt_str); ++ break; ++ } ++ bindex = n; ++ err = opt_add(opt, args[1].from, sb, bindex); ++ break; ++ case Opt_append: ++ case Opt_prepend: ++ err = opt_add(opt, args[0].from, sb, /*dummy bindex*/1); ++ if (!err) ++ opt->type = token; ++ break; ++ case Opt_del: ++ u.del = &opt->del; ++ u.del->path = args[0].from; ++ LKTRTrace("del path %s\n", u.del->path); ++ // LSM may detect it ++ // do not superio. ++ err = path_lookup(u.del->path, lkup_dirflags, &nd); ++ if (unlikely(err)) { ++ Err("lookup failed %s (%d)\n", u.del->path, err); ++ break; ++ } ++ u.del->h_root = dget(nd.dentry); ++ path_release(&nd); ++ opt->type = token; ++ break; ++#if 0 ++ case Opt_idel: ++ u.del = &opt->del; ++ u.del->path = "(indexed)"; ++ if (unlikely(match_int(&args[0], &n))) { ++ Err("bad integer in %s\n", opt_str); ++ break; ++ } ++ bindex = n; ++ aufs_read_lock(root, !AUFS_I_RLOCK); ++ if (bindex < 0 || sbend(sb) < bindex) { ++ Err("out of bounds, %d\n", bindex); ++ aufs_read_unlock(root, !AUFS_I_RLOCK); ++ break; ++ } ++ err = 0; ++ u.del->h_root = dget(au_h_dptr_i(root, bindex)); ++ opt->type = token; ++ aufs_read_unlock(root, !AUFS_I_RLOCK); ++ break; ++#endif ++ ++ case Opt_mod: ++ u.mod = &opt->mod; ++ u.mod->path = args[0].from; ++ p = strchr(u.mod->path, '='); ++ if (unlikely(!p)) { ++ Err("no permssion %s\n", opt_str); ++ break; ++ } ++ *p++ = 0; ++ u.mod->perm = br_perm_val(p); ++ LKTRTrace("mod path %s, perm 0x%x, %s\n", ++ u.mod->path, u.mod->perm, p); ++ // LSM may detect it ++ // do not superio. ++ err = path_lookup(u.mod->path, lkup_dirflags, &nd); ++ if (unlikely(err)) { ++ Err("lookup failed %s (%d)\n", u.mod->path, err); ++ break; ++ } ++ u.mod->h_root = dget(nd.dentry); ++ path_release(&nd); ++ opt->type = token; ++ break; ++#if 0 ++ case Opt_imod: ++ u.mod = &opt->mod; ++ u.mod->path = "(indexed)"; ++ if (unlikely(match_int(&args[0], &n))) { ++ Err("bad integer in %s\n", opt_str); ++ break; ++ } ++ bindex = n; ++ aufs_read_lock(root, !AUFS_I_RLOCK); ++ if (bindex < 0 || sbend(sb) < bindex) { ++ Err("out of bounds, %d\n", bindex); ++ aufs_read_unlock(root, !AUFS_I_RLOCK); ++ break; ++ } ++ u.mod->perm = br_perm_val(args[1].from); ++ LKTRTrace("mod path %s, perm 0x%x, %s\n", ++ u.mod->path, u.mod->perm, args[1].from); ++ err = 0; ++ u.mod->h_root = dget(au_h_dptr_i(root, bindex)); ++ opt->type = token; ++ aufs_read_unlock(root, !AUFS_I_RLOCK); ++ break; ++#endif ++ case Opt_xino: ++ u.xino = &opt->xino; ++ file = xino_create(sb, args[0].from, /*silent*/0, ++ /*parent*/NULL); ++ err = PTR_ERR(file); ++ if (IS_ERR(file)) ++ break; ++ err = -EINVAL; ++ if (unlikely(file->f_dentry->d_sb == sb)) { ++ fput(file); ++ Err("%s must be outside\n", args[0].from); ++ break; ++ } ++ err = 0; ++ u.xino->file = file; ++ u.xino->path = args[0].from; ++ opt->type = token; ++ break; ++ ++ case Opt_dirwh: ++ if (unlikely(match_int(&args[0], &opt->dirwh))) ++ break; ++ err = 0; ++ opt->type = token; ++ break; ++ ++ case Opt_rdcache: ++ if (unlikely(match_int(&args[0], &opt->rdcache))) ++ break; ++ err = 0; ++ opt->type = token; ++ break; ++ ++ case Opt_noxino: ++ case Opt_plink: ++ case Opt_noplink: ++ case Opt_list_plink: ++ case Opt_clean_plink: ++ case Opt_diropq_a: ++ case Opt_diropq_w: ++ case Opt_warn_perm: ++ case Opt_nowarn_perm: ++ case Opt_dlgt: ++ case Opt_nodlgt: ++ err = 0; ++ opt->type = token; ++ break; ++ ++ case Opt_udba: ++ opt->udba = udba_val(args[0].from); ++ if (opt->udba >= 0) { ++ err = 0; ++ opt->type = token; ++ } ++ break; ++ ++#if 0 ++ case Opt_coo: ++ opt->coo = coo_val(args[0].from); ++ if (opt->coo >= 0) { ++ err = 0; ++ opt->type = token; ++ } ++ break; ++#endif ++ ++ case Opt_ignore: ++#ifndef CONFIG_AUFS_COMPAT ++ Warn("ignored %s\n", opt_str); ++#endif ++ skipped = 1; ++ err = 0; ++ break; ++ case Opt_err: ++ Err("unknown option %s\n", opt_str); ++ break; ++ } ++ ++ if (!err && !skipped) { ++ if (unlikely(++opt > opt_tail)) { ++ err = -E2BIG; ++ opt--; ++ opt->type = Opt_tail; ++ break; ++ } ++ opt->type = Opt_tail; ++ } ++ } ++ ++ dump_opts(opts); ++ if (unlikely(err)) ++ au_free_opts(opts); ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * returns, ++ * plus: processed without an error ++ * zero: unprocessed ++ */ ++static int au_do_opt_simple(struct super_block *sb, struct opt *opt, ++ int remount, unsigned int *given) ++{ ++ int err; ++ struct aufs_sbinfo *sbinfo = stosi(sb); ++ ++ TraceEnter(); ++ ++ err = 1; /* handled */ ++ switch (opt->type) { ++ case Opt_udba: ++ udba_set(sb, opt->udba); ++ *given |= opt->udba; ++ break; ++ ++ case Opt_plink: ++ au_flag_set(sb, AuFlag_PLINK); ++ *given |= AuFlag_PLINK; ++ break; ++ case Opt_noplink: ++ if (au_flag_test(sb, AuFlag_PLINK)) ++ au_put_plink(sb); ++ au_flag_clr(sb, AuFlag_PLINK); ++ *given |= AuFlag_PLINK; ++ break; ++ case Opt_list_plink: ++ if (au_flag_test(sb, AuFlag_PLINK)) ++ au_list_plink(sb); ++ break; ++ case Opt_clean_plink: ++ if (au_flag_test(sb, AuFlag_PLINK)) ++ au_put_plink(sb); ++ break; ++ ++ case Opt_diropq_a: ++ au_flag_set(sb, AuFlag_ALWAYS_DIROPQ); ++ *given |= AuFlag_ALWAYS_DIROPQ; ++ break; ++ case Opt_diropq_w: ++ au_flag_clr(sb, AuFlag_ALWAYS_DIROPQ); ++ *given |= AuFlag_ALWAYS_DIROPQ; ++ break; ++ ++ case Opt_dlgt: ++ au_flag_set(sb, AuFlag_DLGT); ++ *given |= AuFlag_DLGT; ++ break; ++ case Opt_nodlgt: ++ au_flag_clr(sb, AuFlag_DLGT); ++ *given |= AuFlag_DLGT; ++ break; ++ ++ case Opt_warn_perm: ++ au_flag_set(sb, AuFlag_WARN_PERM); ++ *given |= AuFlag_WARN_PERM; ++ break; ++ case Opt_nowarn_perm: ++ au_flag_clr(sb, AuFlag_WARN_PERM); ++ *given |= AuFlag_WARN_PERM; ++ break; ++ ++ case Opt_coo: ++ coo_set(sb, opt->coo); ++ *given |= opt->coo; ++ break; ++ ++ case Opt_dirwh: ++ sbinfo->si_dirwh = opt->dirwh; ++ break; ++ ++ case Opt_rdcache: ++ sbinfo->si_rdcache = opt->rdcache * HZ; ++ break; ++ ++ default: ++ err = 0; ++ break; ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * returns tri-state. ++ * plus: processed without an error ++ * zero: unprocessed ++ * minus: error ++ */ ++static int au_do_opt_br(struct super_block *sb, struct opt *opt, int remount, ++ int *do_refresh) ++{ ++ int err; ++ ++ TraceEnter(); ++ ++ err = 0; ++ switch (opt->type) { ++ case Opt_append: ++ opt->add.bindex = sbend(sb) + 1; ++ goto add; ++ case Opt_prepend: ++ opt->add.bindex = 0; ++ add: ++ case Opt_add: ++ err = br_add(sb, &opt->add, remount); ++ if (!err) ++ *do_refresh = err = 1; ++ break; ++ ++ case Opt_del: ++ case Opt_idel: ++ err = br_del(sb, &opt->del, remount); ++ if (!err) ++ *do_refresh = err = 1; ++ break; ++ ++ case Opt_mod: ++ case Opt_imod: ++ err = br_mod(sb, &opt->mod, remount, do_refresh); ++ if (!err) ++ err = 1; ++ break; ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int au_do_opt_xino(struct super_block *sb, struct opt *opt, int remount, ++ struct opt_xino **opt_xino) ++{ ++ int err; ++ ++ TraceEnter(); ++ ++ err = 0; ++ switch (opt->type) { ++ case Opt_xino: ++ err = xino_set(sb, &opt->xino, remount); ++ if (!err) ++ *opt_xino = &opt->xino; ++ break; ++ case Opt_noxino: ++ err = xino_clr(sb); ++ break; ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int verify_opts(struct super_block *sb, int remount) ++{ ++ int err; ++ aufs_bindex_t bindex, bend; ++ struct aufs_branch *br; ++ struct dentry *root; ++ struct inode *dir; ++ unsigned int do_plink; ++ ++ TraceEnter(); ++ ++ if (unlikely(!(sb->s_flags & MS_RDONLY) ++ && !br_writable(sbr_perm(sb, 0)))) ++ Warn("first branch should be rw\n"); ++ ++ err = 0; ++ root = sb->s_root; ++ dir = sb->s_root->d_inode; ++ do_plink = au_flag_test(sb, AuFlag_PLINK); ++ bend = sbend(sb); ++ for (bindex = 0; !err && bindex <= bend; bindex++) { ++ struct inode *h_dir; ++ int skip; ++ ++ skip = 0; ++ h_dir = au_h_iptr_i(dir, bindex); ++ br = stobr(sb, bindex); ++ br_wh_read_lock(br); ++ switch (br->br_perm) { ++ case AuBr_RR: ++ case AuBr_RO: ++ case AuBr_RRWH: ++ case AuBr_ROWH: ++ skip = (!br->br_wh && !br->br_plink); ++ break; ++ ++ case AuBr_RWNoLinkWH: ++ skip = !br->br_wh; ++ if (skip) { ++ if (do_plink) ++ skip = !!br->br_plink; ++ else ++ skip = !br->br_plink; ++ } ++ break; ++ ++ case AuBr_RW: ++ skip = !!br->br_wh; ++ if (skip) { ++ if (do_plink) ++ skip = !!br->br_plink; ++ else ++ skip = !br->br_plink; ++ } ++ break; ++ ++ default: ++ BUG(); ++ } ++ br_wh_read_unlock(br); ++ ++ if (skip) ++ continue; ++ ++ hdir_lock(h_dir, dir, bindex); ++ br_wh_write_lock(br); ++ err = init_wh(au_h_dptr_i(root, bindex), br, ++ au_nfsmnt(sb, bindex), sb); ++ br_wh_write_unlock(br); ++ hdir_unlock(h_dir, dir, bindex); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++int au_do_opts_mount(struct super_block *sb, struct opts *opts) ++{ ++ int err, do_refresh; ++ struct inode *dir; ++ struct opt *opt; ++ unsigned int flags, given; ++ struct opt_xino *opt_xino; ++ aufs_bindex_t bend, bindex; ++ ++ TraceEnter(); ++ SiMustWriteLock(sb); ++ DiMustWriteLock(sb->s_root); ++ dir = sb->s_root->d_inode; ++ IiMustWriteLock(dir); ++ ++ err = 0; ++ given = 0; ++ opt_xino = NULL; ++ opt = opts->opt; ++ while (err >= 0 && opt->type != Opt_tail) ++ err = au_do_opt_simple(sb, opt++, /*remount*/0, &given); ++ if (err > 0) ++ err = 0; ++ else if (unlikely(err < 0)) ++ goto out; ++ ++ /* disable them temporary */ ++ flags = au_flag_test(sb, AuFlag_XINO | AuMask_UDBA | AuFlag_DLGT); ++ au_flag_clr(sb, AuFlag_XINO | AuFlag_DLGT); ++ udba_set(sb, AuFlag_UDBA_REVAL); ++ ++ do_refresh = 0; ++ opt = opts->opt; ++ while (err >= 0 && opt->type != Opt_tail) ++ err = au_do_opt_br(sb, opt++, /*remount*/0, &do_refresh); ++ if (err > 0) ++ err = 0; ++ else if (unlikely(err < 0)) ++ goto out; ++ ++ bend = sbend(sb); ++ if (unlikely(bend < 0)) { ++ err = -EINVAL; ++ Err("no branches\n"); ++ goto out; ++ } ++ ++ if (flags & AuFlag_XINO) ++ au_flag_set(sb, AuFlag_XINO); ++ opt = opts->opt; ++ while (!err && opt->type != Opt_tail) ++ err = au_do_opt_xino(sb, opt++, /*remount*/0, &opt_xino); ++ if (unlikely(err)) ++ goto out; ++ ++ //todo: test this error case. ++ err = verify_opts(sb, /*remount*/0); ++ DEBUG_ON(err); ++ if (unlikely(err)) ++ goto out; ++ ++ /* enable xino */ ++ if (au_flag_test(sb, AuFlag_XINO) && !opt_xino) { ++ struct file *xino_file = xino_def(sb); ++ err = PTR_ERR(xino_file); ++ if (IS_ERR(xino_file)) ++ goto out; ++ ++ err = 0; ++ for (bindex = 0; !err && bindex <= bend; bindex++) ++ err = xino_init(sb, bindex, xino_file, ++ /*do_test*/bindex); ++ fput(xino_file); ++ if (unlikely(err)) ++ goto out; ++ } ++ ++ /* restore hinotify */ ++ udba_set(sb, flags & AuMask_UDBA); ++ if (flags & AuFlag_UDBA_INOTIFY) ++ au_reset_hinotify(dir, au_hi_flags(dir, 1) & ~AUFS_HI_XINO); ++ ++ /* restore dlgt */ ++ if (flags & AuFlag_DLGT) ++ au_flag_set(sb, AuFlag_DLGT); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++int au_do_opts_remount(struct super_block *sb, struct opts *opts, ++ int *do_refresh, unsigned int *given) ++{ ++ int err, rerr; ++ struct inode *dir; ++ struct opt_xino *opt_xino; ++ struct opt *opt; ++ unsigned int dlgt; ++ ++ TraceEnter(); ++ SiMustWriteLock(sb); ++ DiMustWriteLock(sb->s_root); ++ dir = sb->s_root->d_inode; ++ IiMustWriteLock(dir); ++ //DEBUG_ON(au_flag_test(sb, AuFlag_UDBA_INOTIFY)); ++ ++ err = 0; ++ *do_refresh = 0; ++ *given = 0; ++ dlgt = au_flag_test(sb, AuFlag_DLGT); ++ opt_xino = NULL; ++ opt = opts->opt; ++ while (err >= 0 && opt->type != Opt_tail) { ++ err = au_do_opt_simple(sb, opt, /*remount*/1, given); ++ ++ /* disable it temporary */ ++ dlgt = au_flag_test(sb, AuFlag_DLGT); ++ au_flag_clr(sb, AuFlag_DLGT); ++ ++ if (!err) ++ err = au_do_opt_br(sb, opt, /*remount*/1, do_refresh); ++ if (!err) ++ err = au_do_opt_xino(sb, opt, /*remount*/1, &opt_xino); ++ ++ /* restore it */ ++ au_flag_set(sb, dlgt); ++ opt++; ++ } ++ if (err > 0) ++ err = 0; ++ TraceErr(err); ++ ++ /* go on if err */ ++ ++ //todo: test this error case. ++ au_flag_clr(sb, AuFlag_DLGT); ++ rerr = verify_opts(sb, /*remount*/1); ++ au_flag_set(sb, dlgt); ++ ++ /* they are handled by the caller */ ++ if (!*do_refresh) ++ *do_refresh = !!((*given & AuMask_UDBA) ++ || au_flag_test(sb, AuFlag_XINO)); ++ ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/opts.h b/fs/aufs/opts.h +new file mode 100755 +index 0000000..16c1a6a +--- /dev/null ++++ b/fs/aufs/opts.h +@@ -0,0 +1,96 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: opts.h,v 1.13 2007/05/14 06:27:18 sfjro Exp $ */ ++ ++#ifndef __AUFS_OPTS_H__ ++#define __AUFS_OPTS_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/namei.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,22) ++typedef const char* au_parser_pattern_t; ++#else ++typedef char* au_parser_pattern_t; ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct opt_add { ++ aufs_bindex_t bindex; ++ char *path; ++ int perm; ++ struct nameidata nd; ++}; ++ ++struct opt_del { ++ char *path; ++ struct dentry *h_root; ++}; ++ ++struct opt_mod { ++ char *path; ++ int perm; ++ struct dentry *h_root; ++}; ++ ++struct opt_xino { ++ char *path; ++ struct file *file; ++}; ++ ++struct opt { ++ int type; ++ union { ++ struct opt_xino xino; ++ struct opt_add add; ++ struct opt_del del; ++ struct opt_mod mod; ++ int dirwh; ++ int rdcache; ++ int deblk; ++ int nhash; ++ int udba; ++ int coo; ++ }; ++}; ++ ++struct opts { ++ struct opt *opt; ++ int max_opt; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++int br_perm_str(char *p, unsigned int len, int brperm); ++au_parser_pattern_t udba_str(int udba); ++void udba_set(struct super_block *sb, unsigned int flg); ++//au_parser_pattern_t coo_str(int coo); ++void au_free_opts(struct opts *opts); ++int au_parse_opts(struct super_block *sb, char *str, struct opts *opts); ++int au_do_opts_mount(struct super_block *sb, struct opts *opts); ++int au_do_opts_remount(struct super_block *sb, struct opts *opts, ++ int *do_refresh, unsigned int *given); ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_OPTS_H__ */ +diff --git a/fs/aufs/plink.c b/fs/aufs/plink.c +new file mode 100755 +index 0000000..0e520af +--- /dev/null ++++ b/fs/aufs/plink.c +@@ -0,0 +1,331 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: plink.c,v 1.4 2007/05/14 03:39:10 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++struct pseudo_link { ++ struct list_head list; ++ struct inode *inode; ++}; ++ ++#ifdef CONFIG_AUFS_DEBUG ++void au_list_plink(struct super_block *sb) ++{ ++ struct aufs_sbinfo *sbinfo; ++ struct list_head *plink_list; ++ struct pseudo_link *plink; ++ ++ TraceEnter(); ++ SiMustAnyLock(sb); ++ DEBUG_ON(!au_flag_test(sb, AuFlag_PLINK)); ++ ++ sbinfo = stosi(sb); ++ plink_list = &sbinfo->si_plink; ++ spin_lock(&sbinfo->si_plink_lock); ++ list_for_each_entry(plink, plink_list, list) ++ Dbg("%lu\n", plink->inode->i_ino); ++ spin_unlock(&sbinfo->si_plink_lock); ++} ++#endif ++ ++int au_is_plinked(struct super_block *sb, struct inode *inode) ++{ ++ int found; ++ struct aufs_sbinfo *sbinfo; ++ struct list_head *plink_list; ++ struct pseudo_link *plink; ++ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ SiMustAnyLock(sb); ++ DEBUG_ON(!au_flag_test(sb, AuFlag_PLINK)); ++ ++ found = 0; ++ sbinfo = stosi(sb); ++ plink_list = &sbinfo->si_plink; ++ spin_lock(&sbinfo->si_plink_lock); ++ list_for_each_entry(plink, plink_list, list) ++ if (plink->inode == inode) { ++ found = 1; ++ break; ++ } ++ spin_unlock(&sbinfo->si_plink_lock); ++ return found; ++} ++ ++// 20 is max digits length of ulong 64 ++#define PLINK_NAME_LEN ((20 + 1) * 2) ++ ++static int plink_name(char *name, int len, struct inode *inode, ++ aufs_bindex_t bindex) ++{ ++ int rlen; ++ struct inode *h_inode; ++ ++ LKTRTrace("i%lu, b%d\n", inode->i_ino, bindex); ++ DEBUG_ON(len != PLINK_NAME_LEN); ++ h_inode = au_h_iptr_i(inode, bindex); ++ DEBUG_ON(!h_inode); ++ rlen = snprintf(name, len, "%lu.%lu", inode->i_ino, h_inode->i_ino); ++ DEBUG_ON(rlen >= len); ++ return rlen; ++} ++ ++struct dentry *lkup_plink(struct super_block *sb, aufs_bindex_t bindex, ++ struct inode *inode) ++{ ++ struct dentry *h_dentry, *h_parent; ++ struct aufs_branch *br; ++ struct inode *h_dir; ++ char tgtname[PLINK_NAME_LEN]; ++ int len; ++ struct lkup_args lkup; ++ ++ LKTRTrace("b%d, i%lu\n", bindex, inode->i_ino); ++ br = stobr(sb, bindex); ++ h_parent = br->br_plink; ++ DEBUG_ON(!h_parent); ++ h_dir = h_parent->d_inode; ++ DEBUG_ON(!h_dir); ++ ++ len = plink_name(tgtname, sizeof(tgtname), inode, bindex); ++ ++ // always superio. ++ lkup.nfsmnt = au_do_nfsmnt(br->br_mnt); ++ lkup.dlgt = need_dlgt(sb); ++ hi_lock_whplink(h_dir); ++ h_dentry = sio_lkup_one(tgtname, h_parent, len, &lkup); ++ i_unlock(h_dir); ++ return h_dentry; ++} ++ ++static int do_whplink(char *tgt, int len, struct dentry *h_parent, ++ struct dentry *h_dentry, struct vfsmount *nfsmnt, ++ struct super_block *sb) ++{ ++ int err; ++ struct dentry *h_tgt; ++ struct inode *h_dir; ++ struct lkup_args lkup = { ++ .nfsmnt = nfsmnt, ++ .dlgt = need_dlgt(sb) ++ }; ++ ++ h_tgt = lkup_one(tgt, h_parent, len, &lkup); ++ err = PTR_ERR(h_tgt); ++ if (IS_ERR(h_tgt)) ++ goto out; ++ ++ err = 0; ++ h_dir = h_parent->d_inode; ++ if (unlikely(h_tgt->d_inode && h_tgt->d_inode != h_dentry->d_inode)) ++ err = vfsub_unlink(h_dir, h_tgt, lkup.dlgt); ++ if (!err && !h_tgt->d_inode) { ++ err = vfsub_link(h_dentry, h_dir, h_tgt, lkup.dlgt); ++ //inode->i_nlink++; ++ } ++ dput(h_tgt); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++struct do_whplink_args { ++ int *errp; ++ char *tgt; ++ int len; ++ struct dentry *h_parent; ++ struct dentry *h_dentry; ++ struct vfsmount *nfsmnt; ++ struct super_block *sb; ++}; ++ ++static void call_do_whplink(void *args) ++{ ++ struct do_whplink_args *a = args; ++ *a->errp = do_whplink(a->tgt, a->len, a->h_parent, a->h_dentry, ++ a->nfsmnt, a->sb); ++} ++ ++static int whplink(struct dentry *h_dentry, struct inode *inode, ++ aufs_bindex_t bindex, struct super_block *sb) ++{ ++ int err, len; ++ struct aufs_branch *br; ++ struct dentry *h_parent; ++ struct inode *h_dir; ++ char tgtname[PLINK_NAME_LEN]; ++ ++ LKTRTrace("%.*s\n", DLNPair(h_dentry)); ++ br = stobr(inode->i_sb, bindex); ++ h_parent = br->br_plink; ++ DEBUG_ON(!h_parent); ++ h_dir = h_parent->d_inode; ++ DEBUG_ON(!h_dir); ++ ++ len = plink_name(tgtname, sizeof(tgtname), inode, bindex); ++ ++ // always superio. ++ hi_lock_whplink(h_dir); ++ if (!is_au_wkq(current)) { ++ struct do_whplink_args args = { ++ .errp = &err, ++ .tgt = tgtname, ++ .len = len, ++ .h_parent = h_parent, ++ .h_dentry = h_dentry, ++ .nfsmnt = au_do_nfsmnt(br->br_mnt), ++ .sb = sb ++ }; ++ au_wkq_wait(call_do_whplink, &args, /*dlgt*/0); ++ } else ++ err = do_whplink(tgtname, len, h_parent, h_dentry, ++ au_do_nfsmnt(br->br_mnt), sb); ++ i_unlock(h_dir); ++ ++ TraceErr(err); ++ return err; ++} ++ ++void append_plink(struct super_block *sb, struct inode *inode, ++ struct dentry *h_dentry, aufs_bindex_t bindex) ++{ ++ struct aufs_sbinfo *sbinfo; ++ struct list_head *plink_list; ++ struct pseudo_link *plink; ++ int found, err, cnt; ++ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ SiMustAnyLock(sb); ++ DEBUG_ON(!au_flag_test(sb, AuFlag_PLINK)); ++ ++ cnt = 0; ++ found = 0; ++ sbinfo = stosi(sb); ++ plink_list = &sbinfo->si_plink; ++ spin_lock(&sbinfo->si_plink_lock); ++ list_for_each_entry(plink, plink_list, list) { ++ cnt++; ++ if (plink->inode == inode) { ++ found = 1; ++ break; ++ } ++ } ++ ++ err = 0; ++ if (!found) { ++ struct pseudo_link *plink; ++ ++ plink = kmalloc(sizeof(*plink), GFP_ATOMIC); ++ if (plink) { ++ plink->inode = igrab(inode); ++ list_add(&plink->list, plink_list); ++ cnt++; ++ } else ++ err = -ENOMEM; ++ } ++ spin_unlock(&sbinfo->si_plink_lock); ++ ++ if (!err) ++ err = whplink(h_dentry, inode, bindex, sb); ++ ++ if (unlikely(cnt > 100)) ++ Warn1("unexpectedly many pseudo links, %d\n", cnt); ++ if (unlikely(err)) ++ Warn("err %d, damaged pseudo link. ignored.\n", err); ++} ++ ++static void do_put_plink(struct pseudo_link *plink, int do_del) ++{ ++ TraceEnter(); ++ ++ iput(plink->inode); ++ if (do_del) ++ list_del(&plink->list); ++ kfree(plink); ++} ++ ++void au_put_plink(struct super_block *sb) ++{ ++ struct aufs_sbinfo *sbinfo; ++ struct list_head *plink_list; ++ struct pseudo_link *plink, *tmp; ++ ++ TraceEnter(); ++ SiMustWriteLock(sb); ++ DEBUG_ON(!au_flag_test(sb, AuFlag_PLINK)); ++ ++ sbinfo = stosi(sb); ++ plink_list = &sbinfo->si_plink; ++ //spin_lock(&sbinfo->si_plink_lock); ++ list_for_each_entry_safe(plink, tmp, plink_list, list) ++ do_put_plink(plink, 0); ++ INIT_LIST_HEAD(plink_list); ++ //spin_unlock(&sbinfo->si_plink_lock); ++} ++ ++void half_refresh_plink(struct super_block *sb, aufs_bindex_t br_id) ++{ ++ struct aufs_sbinfo *sbinfo; ++ struct list_head *plink_list; ++ struct pseudo_link *plink, *tmp; ++ struct inode *inode; ++ aufs_bindex_t bstart, bend, bindex; ++ int do_put; ++ ++ TraceEnter(); ++ SiMustWriteLock(sb); ++ DEBUG_ON(!au_flag_test(sb, AuFlag_PLINK)); ++ ++ sbinfo = stosi(sb); ++ plink_list = &sbinfo->si_plink; ++ //spin_lock(&sbinfo->si_plink_lock); ++ list_for_each_entry_safe(plink, tmp, plink_list, list) { ++ do_put = 0; ++ inode = igrab(plink->inode); ++ ii_write_lock_child(inode); ++ bstart = ibstart(inode); ++ bend = ibend(inode); ++ if (bstart >= 0) { ++ for (bindex = bstart; bindex <= bend; bindex++) { ++ if (!au_h_iptr_i(inode, bindex) ++ || itoid_index(inode, bindex) != br_id) ++ continue; ++ set_h_iptr(inode, bindex, NULL, 0); ++ do_put = 1; ++ break; ++ } ++ } else ++ do_put_plink(plink, 1); ++ ++ if (do_put) { ++ for (bindex = bstart; bindex <= bend; bindex++) ++ if (au_h_iptr_i(inode, bindex)) { ++ do_put = 0; ++ break; ++ } ++ if (do_put) ++ do_put_plink(plink, 1); ++ } ++ ii_write_unlock(inode); ++ iput(inode); ++ } ++ //spin_unlock(&sbinfo->si_plink_lock); ++} +diff --git a/fs/aufs/sbinfo.c b/fs/aufs/sbinfo.c +new file mode 100755 +index 0000000..55cb64c +--- /dev/null ++++ b/fs/aufs/sbinfo.c +@@ -0,0 +1,173 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: sbinfo.c,v 1.30 2007/05/14 03:39:31 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++struct aufs_sbinfo *stosi(struct super_block *sb) ++{ ++ struct aufs_sbinfo *sbinfo; ++ sbinfo = sb->s_fs_info; ++ //DEBUG_ON(sbinfo->si_bend < 0); ++ return sbinfo; ++} ++ ++aufs_bindex_t sbend(struct super_block *sb) ++{ ++ SiMustAnyLock(sb); ++ return stosi(sb)->si_bend; ++} ++ ++struct aufs_branch *stobr(struct super_block *sb, aufs_bindex_t bindex) ++{ ++ SiMustAnyLock(sb); ++ DEBUG_ON(bindex < 0 || sbend(sb) < bindex ++ || !stosi(sb)->si_branch[0 + bindex]); ++ return stosi(sb)->si_branch[0 + bindex]; ++} ++ ++int au_sigen(struct super_block *sb) ++{ ++ SiMustAnyLock(sb); ++ return stosi(sb)->si_generation; ++} ++ ++int au_sigen_inc(struct super_block *sb) ++{ ++ int gen; ++ ++ SiMustWriteLock(sb); ++ gen = ++stosi(sb)->si_generation; ++ au_update_digen(sb->s_root); ++ au_update_iigen(sb->s_root->d_inode); ++ sb->s_root->d_inode->i_version++; ++ return gen; ++} ++ ++int find_bindex(struct super_block *sb, struct aufs_branch *br) ++{ ++ aufs_bindex_t bindex, bend; ++ ++ bend = sbend(sb); ++ for (bindex = 0; bindex <= bend; bindex++) ++ if (stobr(sb, bindex) == br) ++ return bindex; ++ return -1; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* dentry and super_block lock. call at entry point */ ++void aufs_read_lock(struct dentry *dentry, int flags) ++{ ++ si_read_lock(dentry->d_sb); ++ if (flags & AUFS_D_WLOCK) ++ di_write_lock_child(dentry); ++ else ++ di_read_lock_child(dentry, flags); ++} ++ ++void aufs_read_unlock(struct dentry *dentry, int flags) ++{ ++ if (flags & AUFS_D_WLOCK) ++ di_write_unlock(dentry); ++ else ++ di_read_unlock(dentry, flags); ++ si_read_unlock(dentry->d_sb); ++} ++ ++void aufs_write_lock(struct dentry *dentry) ++{ ++ //au_wkq_wait_nwtask(); ++ si_write_lock(dentry->d_sb); ++ di_write_lock_child(dentry); ++} ++ ++void aufs_write_unlock(struct dentry *dentry) ++{ ++ di_write_unlock(dentry); ++ si_write_unlock(dentry->d_sb); ++ //au_wkq_wait_nwtask(); ++} ++ ++void aufs_read_and_write_lock2(struct dentry *d1, struct dentry *d2, int isdir) ++{ ++ DEBUG_ON(d1 == d2 || d1->d_sb != d2->d_sb); ++ si_read_lock(d1->d_sb); ++ di_write_lock2_child(d1, d2, isdir); ++} ++ ++void aufs_read_and_write_unlock2(struct dentry *d1, struct dentry *d2) ++{ ++ DEBUG_ON(d1 == d2 || d1->d_sb != d2->d_sb); ++ di_write_unlock2(d1, d2); ++ si_read_unlock(d1->d_sb); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++aufs_bindex_t new_br_id(struct super_block *sb) ++{ ++ aufs_bindex_t br_id; ++ ++ TraceEnter(); ++ SiMustWriteLock(sb); ++ ++ while (1) { ++ br_id = ++stosi(sb)->si_last_br_id; ++ if (br_id && find_brindex(sb, br_id) < 0) ++ return br_id; ++ } ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_SYSAUFS ++static int make_xino(struct seq_file *seq, struct sysaufs_args *args, ++ int *do_size) ++{ ++ int err; ++ struct super_block *sb = args->sb; ++ aufs_bindex_t bindex, bend; ++ struct file *xf; ++ struct inode *xi; ++ ++ TraceEnter(); ++ DEBUG_ON(args->index != SysaufsSb_XINO); ++ SiMustReadLock(sb); ++ ++ *do_size = 0; ++ err = seq_printf(seq, "%d %lu\n", sizeof(struct xino), ++ atomic_long_read(&stosi(sb)->si_xino)); ++ bend = sbend(sb); ++ for (bindex = 0; !err && bindex <= bend; bindex++) { ++ xf = stobr(sb, bindex)->br_xino; ++ xi = xf->f_dentry->d_inode; ++ err = seq_printf(seq, "%d: %d, %Lux%d %Ld\n", ++ bindex, file_count(xf), ++ (u64)xi->i_blocks, 1 << xi->i_blkbits, ++ i_size_read(xi)); ++ } ++ return err; ++} ++ ++sysaufs_op au_si_ops[] = { ++ [SysaufsSb_XINO] = make_xino ++}; ++#endif +diff --git a/fs/aufs/super.c b/fs/aufs/super.c +new file mode 100755 +index 0000000..c1123f8 +--- /dev/null ++++ b/fs/aufs/super.c +@@ -0,0 +1,716 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: super.c,v 1.50 2007/05/14 03:39:42 sfjro Exp $ */ ++ ++#include <linux/module.h> ++#include <linux/seq_file.h> ++#include <linux/statfs.h> ++#include "aufs.h" ++ ++/* ++ * super_operations ++ */ ++static struct inode *aufs_alloc_inode(struct super_block *sb) ++{ ++ struct aufs_icntnr *c; ++ ++ TraceEnter(); ++ ++ c = cache_alloc_icntnr(); ++ //if (LktrCond) {cache_free_icntnr(c); c = NULL;} ++ if (c) { ++ inode_init_once(&c->vfs_inode); ++ c->vfs_inode.i_version = 1; //sigen(sb); ++ c->iinfo.ii_hinode = NULL; ++ return &c->vfs_inode; ++ } ++ return NULL; ++} ++ ++static void aufs_destroy_inode(struct inode *inode) ++{ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ au_iinfo_fin(inode); ++ cache_free_icntnr(container_of(inode, struct aufs_icntnr, vfs_inode)); ++} ++ ++//todo: how about merge with alloc_inode()? ++static void aufs_read_inode(struct inode *inode) ++{ ++ int err; ++ ++ LKTRTrace("i%lu\n", inode->i_ino); ++ ++ err = au_iinfo_init(inode); ++ //if (LktrCond) err = -1; ++ if (!err) { ++ inode->i_version++; ++ inode->i_op = &aufs_iop; ++ inode->i_fop = &aufs_file_fop; ++ inode->i_mapping->a_ops = &aufs_aop; ++ return; /* success */ ++ } ++ ++ LKTRTrace("intializing inode info failed(%d)\n", err); ++ make_bad_inode(inode); ++} ++ ++int au_show_brs(struct seq_file *seq, struct super_block *sb) ++{ ++ int err; ++ aufs_bindex_t bindex, bend; ++ char a[16]; ++ struct dentry *root; ++ ++ TraceEnter(); ++ SiMustAnyLock(sb); ++ root = sb->s_root; ++ DiMustAnyLock(root); ++ ++ err = 0; ++ bend = sbend(sb); ++ for (bindex = 0; !err && bindex <= bend; bindex++) { ++ err = br_perm_str(a, sizeof(a), sbr_perm(sb, bindex)); ++ if (!err) ++ err = seq_path(seq, sbr_mnt(sb, bindex), ++ au_h_dptr_i(root, bindex), au_esc_chars); ++ if (err > 0) ++ err = seq_printf(seq, "=%s", a); ++ if (!err && bindex != bend) ++ err = seq_putc(seq, ':'); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int aufs_show_options(struct seq_file *m, struct vfsmount *mnt) ++{ ++ int err, n; ++ struct super_block *sb; ++ struct aufs_sbinfo *sbinfo; ++ struct dentry *root; ++ struct file *xino; ++ ++ TraceEnter(); ++ ++ sb = mnt->mnt_sb; ++ root = sb->s_root; ++ aufs_read_lock(root, !AUFS_I_RLOCK); ++ if (au_flag_test(sb, AuFlag_XINO)) { ++ err = seq_puts(m, ",xino="); ++ if (unlikely(err)) ++ goto out; ++ xino = stobr(sb, 0)->br_xino; ++ err = seq_path(m, xino->f_vfsmnt, xino->f_dentry, au_esc_chars); ++ if (unlikely(err <= 0)) ++ goto out; ++ err = 0; ++ ++#define Deleted "\\040(deleted)" ++ m->count -= sizeof(Deleted) - 1; ++ DEBUG_ON(memcmp(m->buf + m->count, Deleted, ++ sizeof(Deleted) - 1)); ++#undef Deleted ++ } else ++ err = seq_puts(m, ",noxino"); ++ ++ n = au_flag_test(sb, AuFlag_PLINK); ++ if (unlikely(!err && (AuDefFlags & AuFlag_PLINK) != n)) ++ err = seq_printf(m, ",%splink", n ? "" : "no"); ++ n = au_flag_test_udba(sb); ++ if (unlikely(!err && (AuDefFlags & AuMask_UDBA) != n)) ++ err = seq_printf(m, ",udba=%s", udba_str(n)); ++ n = au_flag_test(sb, AuFlag_ALWAYS_DIROPQ); ++ if (unlikely(!err && (AuDefFlags & AuFlag_ALWAYS_DIROPQ) != n)) ++ err = seq_printf(m, ",diropq=%c", n ? 'a' : 'w'); ++ n = au_flag_test(sb, AuFlag_DLGT); ++ if (unlikely(!err && (AuDefFlags & AuFlag_DLGT) != n)) ++ err = seq_printf(m, ",%sdlgt", n ? "" : "no"); ++ n = au_flag_test(sb, AuFlag_WARN_PERM); ++ if (unlikely(!err && (AuDefFlags & AuFlag_WARN_PERM) != n)) ++ err = seq_printf(m, ",%swarn_perm", n ? "" : "no"); ++ ++ sbinfo = stosi(sb); ++ n = sbinfo->si_dirwh; ++ if (unlikely(!err && n != AUFS_DIRWH_DEF)) ++ err = seq_printf(m, ",dirwh=%d", n); ++ n = sbinfo->si_rdcache / HZ; ++ if (unlikely(!err && n != AUFS_RDCACHE_DEF)) ++ err = seq_printf(m, ",rdcache=%d", n); ++#if 0 ++ n = au_flag_test_coo(sb); ++ if (unlikely(!err && (AuDefFlags & AuMask_COO) != n)) ++ err = seq_printf(m, ",coo=%s", coo_str(n)); ++#endif ++ ++ if (!err && !sysaufs_brs) { ++#ifdef CONFIG_AUFS_COMPAT ++ err = seq_puts(m, ",dirs="); ++#else ++ err = seq_puts(m, ",br:"); ++#endif ++ if (!err) ++ err = au_show_brs(m, sb); ++ } ++ ++ out: ++ aufs_read_unlock(root, !AUFS_I_RLOCK); ++ TraceErr(err); ++ if (err) ++ err = -E2BIG; ++ TraceErr(err); ++ return err; ++} ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++#define StatfsLock(d) aufs_read_lock((d)->d_sb->s_root, 0) ++#define StatfsUnlock(d) aufs_read_unlock((d)->d_sb->s_root, 0) ++#define StatfsArg(d) au_h_dptr((d)->d_sb->s_root) ++#define StatfsHInode(d) (StatfsArg(d)->d_inode) ++#define StatfsSb(d) ((d)->d_sb) ++static int aufs_statfs(struct dentry *arg, struct kstatfs *buf) ++#else ++#define StatfsLock(s) si_read_lock(s) ++#define StatfsUnlock(s) si_read_unlock(s) ++#define StatfsArg(s) sbr_sb(s, 0) ++#define StatfsHInode(s) (StatfsArg(s)->s_root->d_inode) ++#define StatfsSb(s) (s) ++static int aufs_statfs(struct super_block *arg, struct kstatfs *buf) ++#endif ++{ ++ int err; ++ ++ TraceEnter(); ++ ++ StatfsLock(arg); ++ err = vfsub_statfs(StatfsArg(arg), buf, need_dlgt(StatfsSb(arg))); ++ //if (LktrCond) err = -1; ++ StatfsUnlock(arg); ++ if (!err) { ++ //buf->f_type = AUFS_SUPER_MAGIC; ++ buf->f_type = 0; ++ buf->f_namelen -= AUFS_WH_PFX_LEN; ++ memset(&buf->f_fsid, 0, sizeof(buf->f_fsid)); ++ } ++ //buf->f_bsize = buf->f_blocks = buf->f_bfree = buf->f_bavail = -1; ++ ++ TraceErr(err); ++ return err; ++} ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) || defined(UbuntuEdgy17Umount18) ++#define UmountBeginSb(mnt) (mnt)->mnt_sb ++static void aufs_umount_begin(struct vfsmount *arg, int flags) ++#else ++#define UmountBeginSb(sb) sb ++static void aufs_umount_begin(struct super_block *arg) ++#endif ++{ ++ struct super_block *sb = UmountBeginSb(arg); ++ ++ if (unlikely(!stosi(sb))) ++ return; ++ ++ //au_wkq_wait_nwtask(); ++ si_write_lock(sb); ++ if (au_flag_test(sb, AuFlag_PLINK)) { ++ au_put_plink(sb); ++ //kobj_umount(stosi(sb)); ++ } ++#if 0 ++ if (unlikely(au_flag_test(sb, AuFlag_UDBA_INOTIFY))) ++ shrink_dcache_sb(sb); ++#endif ++ si_write_unlock(sb); ++} ++ ++static void free_sbinfo(struct aufs_sbinfo *sbinfo) ++{ ++ TraceEnter(); ++ DEBUG_ON(!sbinfo ++ || !list_empty(&sbinfo->si_plink)); ++ ++ free_branches(sbinfo); ++ kfree(sbinfo->si_branch); ++ kfree(sbinfo); ++} ++ ++/* final actions when unmounting a file system */ ++static void aufs_put_super(struct super_block *sb) ++{ ++ struct aufs_sbinfo *sbinfo; ++ ++ TraceEnter(); ++ ++ sbinfo = stosi(sb); ++ if (unlikely(!sbinfo)) ++ return; ++ ++ sysaufs_del(sbinfo); ++ ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,18) && !defined(UbuntuEdgy17Umount18) ++ // umount_begin() may not be called. ++ aufs_umount_begin(sb); ++#endif ++ free_sbinfo(sbinfo); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * refresh directories at remount time. ++ */ ++static int do_refresh_dir(struct dentry *dentry, unsigned int flags) ++{ ++ int err; ++ struct dentry *parent; ++ struct inode *inode; ++ ++ LKTRTrace("%.*s\n", DLNPair(dentry)); ++ inode = dentry->d_inode; ++ DEBUG_ON(!inode || !S_ISDIR(inode->i_mode)); ++ ++ di_write_lock_child(dentry); ++ parent = dget_parent(dentry); ++ di_read_lock_parent(parent, AUFS_I_RLOCK); ++ err = au_refresh_hdentry(dentry, S_IFDIR); ++ if (err >= 0) { ++ err = au_refresh_hinode(inode, dentry); ++ if (!err) ++ au_reset_hinotify(inode, flags); ++ } ++ if (unlikely(err)) ++ Err("unrecoverable error %d\n", err); ++ di_read_unlock(parent, AUFS_I_RLOCK); ++ dput(parent); ++ di_write_unlock(dentry); ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int test_dir(struct dentry *dentry, void *arg) ++{ ++ return S_ISDIR(dentry->d_inode->i_mode); ++} ++ ++static int refresh_dir(struct dentry *root, int sgen) ++{ ++ int err, i, j, ndentry; ++ const unsigned int flags = au_hi_flags(root->d_inode, /*isdir*/1); ++ struct au_dcsub_pages dpages; ++ struct au_dpage *dpage; ++ struct dentry **dentries; ++ ++ LKTRTrace("sgen %d\n", sgen); ++ SiMustWriteLock(root->d_sb); ++ DEBUG_ON(au_digen(root) != sgen); ++ DiMustWriteLock(root); ++ ++ err = au_dpages_init(&dpages, GFP_KERNEL); ++ if (unlikely(err)) ++ goto out; ++ err = au_dcsub_pages(&dpages, root, test_dir, NULL); ++ if (unlikely(err)) ++ goto out_dpages; ++ ++ DiMustNoWaiters(root); ++ IiMustNoWaiters(root->d_inode); ++ di_write_unlock(root); ++ for (i = 0; !err && i < dpages.ndpage; i++) { ++ dpage = dpages.dpages + i; ++ dentries = dpage->dentries; ++ ndentry = dpage->ndentry; ++ for (j = 0; !err && j < ndentry; j++) { ++ struct dentry *d; ++ d = dentries[j]; ++ DEBUG_ON(!S_ISDIR(d->d_inode->i_mode) ++ || IS_ROOT(d) ++ || au_digen(d->d_parent) != sgen); ++ if (au_digen(d) != sgen) ++ err = do_refresh_dir(d, flags); ++ } ++ } ++ di_write_lock_child(root); /* aufs_write_lock() calls ..._child() */ ++ ++ out_dpages: ++ au_dpages_free(&dpages); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* stop extra interpretation of errno in mount(8), and strange error messages */ ++static int cvt_err(int err) ++{ ++ TraceErr(err); ++ ++ switch (err) { ++ case -ENOENT: ++ case -ENOTDIR: ++ case -EEXIST: ++ case -EIO: ++ err = -EINVAL; ++ } ++ return err; ++} ++ ++/* protected by s_umount */ ++static int aufs_remount_fs(struct super_block *sb, int *flags, char *data) ++{ ++ int err, do_refresh; ++ struct dentry *root; ++ struct inode *inode; ++ struct opts opts; ++ unsigned int given, dlgt; ++ ++ //au_debug_on(); ++ LKTRTrace("flags 0x%x, data %s, len %d\n", ++ *flags, data ? data : "NULL", data ? strlen(data) : 0); ++ ++ err = 0; ++ if (unlikely(!data || !*data)) ++ goto out; /* success */ ++ ++ err = -ENOMEM; ++ memset(&opts, 0, sizeof(opts)); ++ opts.opt = (void*)__get_free_page(GFP_KERNEL); ++ //if (LktrCond) {free_page((unsigned long)opts.opt); opts.opt = NULL;} ++ if (unlikely(!opts.opt)) ++ goto out; ++ opts.max_opt = PAGE_SIZE / sizeof(*opts.opt); ++ ++ /* parse it before aufs lock */ ++ err = au_parse_opts(sb, data, &opts); ++ //if (LktrCond) {au_free_opts(&opts); err = -1;} ++ if (unlikely(err)) ++ goto out_opts; ++ ++ root = sb->s_root; ++ inode = root->d_inode; ++ i_lock(inode); ++ aufs_write_lock(root); ++ ++ //DbgSleep(3); ++ ++ /* au_do_opts() may return an error */ ++ do_refresh = 0; ++ given = 0; ++ err = au_do_opts_remount(sb, &opts, &do_refresh, &given); ++ //if (LktrCond) err = -1; ++ au_free_opts(&opts); ++ ++ if (do_refresh) { ++ int rerr; ++ struct aufs_sbinfo *sbinfo; ++ ++ dlgt = au_flag_test(sb, AuFlag_DLGT); ++ au_flag_clr(sb, AuFlag_DLGT); ++ au_sigen_inc(sb); ++ au_reset_hinotify(inode, au_hi_flags(inode, /*isdir*/1)); ++ sbinfo = stosi(sb); ++ sbinfo->si_failed_refresh_dirs = 0; ++ rerr = refresh_dir(root, au_sigen(sb)); ++ if (unlikely(rerr)) { ++ sbinfo->si_failed_refresh_dirs = 1; ++ Warn("Refreshing directories failed, ignores (%d)\n", ++ rerr); ++ } ++ au_cpup_attr_all(inode); ++ au_flag_set(sb, dlgt); ++ } ++ ++ aufs_write_unlock(root); ++ i_unlock(inode); ++ /* braces are added to stop a warning */ ++ if (do_refresh) { ++ sysaufs_notify_remount(); ++ } ++ ++ out_opts: ++ free_page((unsigned long)opts.opt); ++ out: ++ err = cvt_err(err); ++ TraceErr(err); ++ //au_debug_off(); ++ return err; ++} ++ ++static struct super_operations aufs_sop = { ++ .alloc_inode = aufs_alloc_inode, ++ .destroy_inode = aufs_destroy_inode, ++ .read_inode = aufs_read_inode, ++ //.dirty_inode = aufs_dirty_inode, ++ //.write_inode = aufs_write_inode, ++ //void (*put_inode) (struct inode *); ++ .drop_inode = generic_delete_inode, ++ //.delete_inode = aufs_delete_inode, ++ //.clear_inode = aufs_clear_inode, ++ ++ .show_options = aufs_show_options, ++ .statfs = aufs_statfs, ++ ++ .put_super = aufs_put_super, ++ //void (*write_super) (struct super_block *); ++ //int (*sync_fs)(struct super_block *sb, int wait); ++ //void (*write_super_lockfs) (struct super_block *); ++ //void (*unlockfs) (struct super_block *); ++ .remount_fs = aufs_remount_fs, ++ // depends upon umount flags. also use put_super() (< 2.6.18) ++ .umount_begin = aufs_umount_begin ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * at first mount time. ++ */ ++ ++static int alloc_sbinfo(struct super_block *sb) ++{ ++ struct aufs_sbinfo *sbinfo; ++ ++ TraceEnter(); ++ ++ sbinfo = kmalloc(sizeof(*sbinfo), GFP_KERNEL); ++ //if (LktrCond) {kfree(sbinfo); sbinfo = NULL;} ++ if (unlikely(!sbinfo)) ++ goto out; ++ sbinfo->si_branch = kzalloc(sizeof(*sbinfo->si_branch), GFP_KERNEL); ++ //if (LktrCond) {kfree(sbinfo->si_branch); sbinfo->si_branch = NULL;} ++ if (unlikely(!sbinfo->si_branch)) { ++ kfree(sbinfo); ++ goto out; ++ } ++ rw_init_wlock(&sbinfo->si_rwsem); ++ sbinfo->si_bend = -1; ++ atomic_long_set(&sbinfo->si_xino, AUFS_FIRST_INO); ++ spin_lock_init(&sbinfo->si_plink_lock); ++ INIT_LIST_HEAD(&sbinfo->si_plink); ++ init_lvma(sbinfo); ++ sbinfo->si_generation = 0; ++ sbinfo->si_last_br_id = 0; ++ sbinfo->si_failed_refresh_dirs = 0; ++ sbinfo->si_flags = 0; ++ sbinfo->si_dirwh = AUFS_DIRWH_DEF; ++ sbinfo->si_rdcache = AUFS_RDCACHE_DEF * HZ; ++ //atomic_set(&sbinfo->si_hinotify, 0); ++ //init_waitqueue_head(&sbinfo->si_hinotify_wq); ++ ++ sb->s_fs_info = sbinfo; ++ au_flag_set(sb, AuDefFlags); ++#ifdef ForceInotify ++ udba_set(sb, AuFlag_UDBA_INOTIFY); ++#endif ++#ifdef ForceDlgt ++ au_flag_set(sb, AuFlag_DLGT); ++#endif ++#ifdef ForceNoPlink ++ au_flag_clr(sb, AuFlag_PLINK); ++#endif ++ return 0; /* success */ ++ ++ out: ++ TraceErr(-ENOMEM); ++ return -ENOMEM; ++} ++ ++static int alloc_root(struct super_block *sb) ++{ ++ int err; ++ struct inode *inode; ++ struct dentry *root; ++ ++ TraceEnter(); ++ ++ err = -ENOMEM; ++ inode = iget(sb, AUFS_ROOT_INO); ++ //if (LktrCond) {iput(inode); inode = NULL;} ++ if (unlikely(!inode)) ++ goto out; ++ err = PTR_ERR(inode); ++ if (IS_ERR(inode)) ++ goto out; ++ err = -ENOMEM; ++ if (unlikely(is_bad_inode(inode))) ++ goto out_iput; ++ ++ root = d_alloc_root(inode); ++ //if (LktrCond) {igrab(inode); dput(root); root = NULL;} ++ if (unlikely(!root)) ++ goto out_iput; ++ err = PTR_ERR(root); ++ if (IS_ERR(root)) ++ goto out_iput; ++ ++ err = au_alloc_dinfo(root); ++ //if (LktrCond){rw_write_unlock(&dtodi(root)->di_rwsem);err=-1;} ++ if (!err) { ++ sb->s_root = root; ++ return 0; /* success */ ++ } ++ dput(root); ++ goto out; /* do not iput */ ++ ++ out_iput: ++ iput(inode); ++ out: ++ TraceErr(err); ++ return err; ++ ++} ++ ++static int aufs_fill_super(struct super_block *sb, void *raw_data, int silent) ++{ ++ int err; ++ struct dentry *root; ++ struct inode *inode; ++ struct opts opts; ++ char *arg = raw_data; ++ ++ //au_debug_on(); ++ if (unlikely(!arg || !*arg)) { ++ err = -EINVAL; ++ Err("no arg\n"); ++ goto out; ++ } ++ LKTRTrace("%s, silent %d\n", arg, silent); ++ ++ err = -ENOMEM; ++ memset(&opts, 0, sizeof(opts)); ++ opts.opt = (void*)__get_free_page(GFP_KERNEL); ++ //if (LktrCond) {free_page((unsigned long)opts.opt); opts.opt = NULL;} ++ if (unlikely(!opts.opt)) ++ goto out; ++ opts.max_opt = PAGE_SIZE / sizeof(*opts.opt); ++ ++ err = alloc_sbinfo(sb); ++ //if (LktrCond) {si_write_unlock(sb);free_sbinfo(stosi(sb));err=-1;} ++ if (unlikely(err)) ++ goto out_opts; ++ SiMustWriteLock(sb); ++ /* all timestamps always follow the ones on the branch */ ++ sb->s_flags |= MS_NOATIME | MS_NODIRATIME; ++ sb->s_op = &aufs_sop; ++ au_init_export_op(sb); ++ //err = kobj_mount(stosi(sb)); ++ //if (err) ++ //goto out_info; ++ ++ err = alloc_root(sb); ++ //if (LktrCond) {rw_write_unlock(&dtodi(sb->s_root)->di_rwsem); ++ //dput(sb->s_root);sb->s_root=NULL;err=-1;} ++ if (unlikely(err)) { ++ DEBUG_ON(sb->s_root); ++ si_write_unlock(sb); ++ goto out_info; ++ } ++ root = sb->s_root; ++ DiMustWriteLock(root); ++ inode = root->d_inode; ++ inode->i_nlink = 2; ++ ++ /* ++ * actually we can parse options regardless aufs lock here. ++ * but at remount time, parsing must be done before aufs lock. ++ * so we follow the same rule. ++ */ ++ ii_write_lock_parent(inode); ++ aufs_write_unlock(root); ++ err = au_parse_opts(sb, arg, &opts); ++ //if (LktrCond) {au_free_opts(&opts); err = -1;} ++ if (unlikely(err)) ++ goto out_root; ++ ++ /* lock vfs_inode first, then aufs. */ ++ i_lock(inode); ++ inode->i_op = &aufs_dir_iop; ++ inode->i_fop = &aufs_dir_fop; ++ aufs_write_lock(root); ++ ++ sb->s_maxbytes = 0; ++ err = au_do_opts_mount(sb, &opts); ++ //if (LktrCond) err = -1; ++ au_free_opts(&opts); ++ if (unlikely(err)) ++ goto out_unlock; ++ DEBUG_ON(!sb->s_maxbytes); ++ ++ //DbgDentry(root); ++ aufs_write_unlock(root); ++ i_unlock(inode); ++ //DbgSb(sb); ++ goto out_opts; /* success */ ++ ++ out_unlock: ++ aufs_write_unlock(root); ++ i_unlock(inode); ++ out_root: ++ dput(root); ++ sb->s_root = NULL; ++ out_info: ++ free_sbinfo(stosi(sb)); ++ sb->s_fs_info = NULL; ++ out_opts: ++ free_page((unsigned long)opts.opt); ++ out: ++ TraceErr(err); ++ err = cvt_err(err); ++ TraceErr(err); ++ //au_debug_off(); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++static int aufs_get_sb(struct file_system_type *fs_type, int flags, ++ const char *dev_name, void *raw_data, ++ struct vfsmount *mnt) ++{ ++ int err; ++ ++ /* all timestamps always follow the ones on the branch */ ++ //mnt->mnt_flags |= MNT_NOATIME | MNT_NODIRATIME; ++ err = get_sb_nodev(fs_type, flags, raw_data, aufs_fill_super, mnt); ++ if (!err) { ++ struct aufs_sbinfo *sbinfo = stosi(mnt->mnt_sb); ++ sbinfo->si_mnt = mnt; ++ sysaufs_add(sbinfo); ++ } ++ return err; ++} ++#else ++static struct super_block *aufs_get_sb(struct file_system_type *fs_type, ++ int flags, const char *dev_name, ++ void *raw_data) ++{ ++ return get_sb_nodev(fs_type, flags, raw_data, aufs_fill_super); ++} ++#endif ++ ++struct file_system_type aufs_fs_type = { ++ .name = AUFS_FSTYPE, ++ .fs_flags = FS_REVAL_DOT, // for UDBA and NFS branch ++ .get_sb = aufs_get_sb, ++ .kill_sb = generic_shutdown_super, ++ //no need to __module_get() and module_put(). ++ .owner = THIS_MODULE, ++}; +diff --git a/fs/aufs/super.h b/fs/aufs/super.h +new file mode 100755 +index 0000000..56ddee1 +--- /dev/null ++++ b/fs/aufs/super.h +@@ -0,0 +1,339 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: super.h,v 1.44 2007/05/14 03:39:54 sfjro Exp $ */ ++ ++#ifndef __AUFS_SUPER_H__ ++#define __AUFS_SUPER_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/version.h> ++#include <linux/aufs_type.h> ++#include "misc.h" ++#include "sysaufs.h" ++ ++#ifdef CONFIG_AUFS_SYSAUFS ++/* entries under sysfs per mount-point */ ++enum {SysaufsSb_XINO, /* SysaufsSb_PLINK, */ SysaufsSb_Last}; ++struct sysaufs_sbinfo { ++ au_subsys_t subsys; ++ struct sysaufs_entry array[SysaufsSb_Last]; ++}; ++extern sysaufs_op au_si_ops[]; ++#else ++struct sysaufs_sbinfo {}; ++#endif ++ ++struct aufs_sbinfo { ++ struct aufs_rwsem si_rwsem; ++ ++ /* branch management */ ++ /* wrap around attack by superuser? No. */ ++ int si_generation; ++ ++ /* ++ * set true when refresh_dirs() at remount time failed. ++ * then try refreshing dirs at access time again. ++ * if it is false, refreshing dirs at access time is unnecesary ++ */ ++ unsigned int si_failed_refresh_dirs:1; ++ ++ aufs_bindex_t si_bend; ++ aufs_bindex_t si_last_br_id; ++ struct aufs_branch **si_branch; ++ ++ /* mount flags */ ++ unsigned int si_flags; ++ ++ /* external inode number table */ ++ atomic_long_t si_xino; // time bomb ++ //struct file *si_xino_bmap; ++ ++ /* readdir cache time, max, in HZ */ ++ unsigned long si_rdcache; ++ ++ /* ++ * If the number of whiteouts are larger than si_dirwh, leave all of ++ * them after rename_whtmp to reduce the cost of rmdir(2). ++ * future fsck.aufs or kernel thread will remove them later. ++ * Otherwise, remove all whiteouts and the dir in rmdir(2). ++ */ ++ unsigned int si_dirwh; ++ ++ /* pseudo_link list */ // dirty ++ spinlock_t si_plink_lock; ++ struct list_head si_plink; ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++ /* super_blocks list is not exported */ ++ struct list_head si_list; ++ struct vfsmount *si_mnt; /* no get/put */ ++#endif ++ ++ /* sysfs */ ++ struct sysaufs_sbinfo si_sysaufs; ++ ++#ifdef CONFIG_AUFS_HINOTIFY ++ /* hinotify */ ++ //atomic_t si_hinotify; ++ //wait_queue_head_t si_hinotify_wq; ++#endif ++ ++#ifdef CONFIG_AUFS_ROBR ++ /* locked vma list for mmap() */ // very dirty ++ spinlock_t si_lvma_lock; ++ struct list_head si_lvma; ++#endif ++}; ++ ++/* an entry in a xino file */ ++struct xino { ++ ino_t ino; ++ //__u32 h_gen; ++} __attribute__ ((packed)); ++ ++//#define AuXino_INVALID_HGEN (-1) ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* Mount flags */ ++#define AuFlag_XINO 1 ++#define AuFlag_ZXINO (1 << 1) ++#define AuFlag_PLINK (1 << 2) ++#define AuFlag_UDBA_NONE (1 << 3) ++#define AuFlag_UDBA_REVAL (1 << 4) ++#define AuFlag_UDBA_INOTIFY (1 << 5) ++#define AuFlag_WARN_PERM (1 << 6) ++#define AuFlag_COO_NONE (1 << 7) ++#define AuFlag_COO_LEAF (1 << 8) ++#define AuFlag_COO_ALL (1 << 9) ++#define AuFlag_ALWAYS_DIROPQ (1 << 10) ++#define AuFlag_DLGT (1 << 11) ++ ++#define AuMask_UDBA (AuFlag_UDBA_NONE | AuFlag_UDBA_REVAL \ ++ | AuFlag_UDBA_INOTIFY) ++#define AuMask_COO (AuFlag_COO_NONE | AuFlag_COO_LEAF \ ++ | AuFlag_COO_ALL) ++ ++#ifdef CONFIG_AUFS_COMPAT ++#define AuDefFlag_DIROPQ AuFlag_ALWAYS_DIROPQ ++#else ++#define AuDefFlag_DIROPQ 0 ++#endif ++ ++#define AuDefFlags_COMM (AuFlag_XINO | AuFlag_UDBA_REVAL | AuFlag_WARN_PERM \ ++ | AuFlag_COO_NONE | AuDefFlag_DIROPQ) ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,16) ++#define AuDefFlags (AuDefFlags_COMM | AuFlag_PLINK) ++#else ++#define AuDefFlags AuDefFlags_COMM ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* flags for aufs_read_lock()/di_read_lock() */ ++#define AUFS_D_WLOCK 1 ++#define AUFS_I_RLOCK 2 ++#define AUFS_I_WLOCK 4 ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* super.c */ ++int au_show_brs(struct seq_file *seq, struct super_block *sb); ++ ++/* xino.c */ ++struct file *xino_create(struct super_block *sb, char *fname, int silent, ++ struct dentry *parent); ++ino_t xino_new_ino(struct super_block *sb); ++int xino_write0(struct super_block *sb, aufs_bindex_t bindex, ino_t h_ino); ++int xino_write(struct super_block *sb, aufs_bindex_t bindex, ino_t h_ino, ++ struct xino *xino); ++int xino_read(struct super_block *sb, aufs_bindex_t bindex, ino_t h_ino, ++ struct xino *xino); ++int xino_init(struct super_block *sb, aufs_bindex_t bindex, ++ struct file *base_file, int do_test); ++struct opt_xino; ++int xino_set(struct super_block *sb, struct opt_xino *xino, int remount); ++int xino_clr(struct super_block *sb); ++struct file *xino_def(struct super_block *sb); ++ ++/* sbinfo.c */ ++struct aufs_sbinfo *stosi(struct super_block *sb); ++aufs_bindex_t sbend(struct super_block *sb); ++struct aufs_branch *stobr(struct super_block *sb, aufs_bindex_t bindex); ++int au_sigen(struct super_block *sb); ++int au_sigen_inc(struct super_block *sb); ++int find_bindex(struct super_block *sb, struct aufs_branch *br); ++ ++void aufs_read_lock(struct dentry *dentry, int flags); ++void aufs_read_unlock(struct dentry *dentry, int flags); ++void aufs_write_lock(struct dentry *dentry); ++void aufs_write_unlock(struct dentry *dentry); ++void aufs_read_and_write_lock2(struct dentry *d1, struct dentry *d2, int isdir); ++void aufs_read_and_write_unlock2(struct dentry *d1, struct dentry *d2); ++ ++aufs_bindex_t new_br_id(struct super_block *sb); ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline const char *au_sbtype(struct super_block *sb) ++{ ++ return sb->s_type->name; ++} ++ ++static inline int au_is_aufs(struct super_block *sb) ++{ ++ return !strcmp(au_sbtype(sb), AUFS_FSTYPE); ++} ++ ++static inline int au_is_nfs(struct super_block *sb) ++{ ++#if defined(CONFIG_NFS_FS) || defined(CONFIG_NFS_FS_MODULE) ++ return !strcmp(au_sbtype(sb), "nfs"); ++#else ++ return 0; ++#endif ++} ++ ++static inline int au_is_remote(struct super_block *sb) ++{ ++ return au_is_nfs(sb); ++} ++ ++#ifdef CONFIG_AUFS_EXPORT ++static inline void au_init_export_op(struct super_block *sb) ++{ ++ extern struct export_operations aufs_export_op; ++ sb->s_export_op = &aufs_export_op; ++} ++ ++static inline int au_is_nfsd(struct task_struct *tsk) ++{ ++ return (!tsk->mm && !strcmp(tsk->comm, "nfsd")); ++} ++ ++static inline void au_nfsd_lockdep_off(void) ++{ ++ /* braces are added to stop a warning */ ++ if (au_is_nfsd(current)) { ++ lockdep_off(); ++ } ++} ++ ++static inline void au_nfsd_lockdep_on(void) ++{ ++ /* braces are added to stop a warning */ ++ if (au_is_nfsd(current)) { ++ lockdep_on(); ++ } ++} ++#else ++static inline int au_is_nfsd(struct task_struct *tsk) ++{ ++ return 0; ++} ++static inline void au_init_export_op(struct super_block *sb) ++{ ++ /* nothing */ ++} ++#define au_nfsd_lockdep_off() /* */ ++#define au_nfsd_lockdep_on() /* */ ++#endif /* CONFIG_AUFS_EXPORT */ ++ ++static inline void init_lvma(struct aufs_sbinfo *sbinfo) ++{ ++#ifdef CONFIG_AUFS_ROBR ++ spin_lock_init(&sbinfo->si_lvma_lock); ++ INIT_LIST_HEAD(&sbinfo->si_lvma); ++#else ++ /* nothing */ ++#endif ++} ++ ++/* limited support before 2.6.18 */ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,18) ++static inline void au_mntget(struct super_block *sb) ++{ ++ mntget(stosi(sb)->si_mnt); ++} ++ ++static inline void au_mntput(struct super_block *sb) ++{ ++ mntput(stosi(sb)->si_mnt); ++} ++#else ++static inline void au_mntget(struct super_block *sb) ++{ ++ /* empty */ ++} ++ ++static inline void au_mntput(struct super_block *sb) ++{ ++ /* empty */ ++} ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline void au_flag_set(struct super_block *sb, unsigned int flag) ++{ ++ //SiMustWriteLock(sb); ++ stosi(sb)->si_flags |= flag; ++} ++ ++static inline void au_flag_clr(struct super_block *sb, unsigned int flag) ++{ ++ //SiMustWriteLock(sb); ++ stosi(sb)->si_flags &= ~flag; ++} ++ ++static inline ++unsigned int au_flag_test(struct super_block *sb, unsigned int flag) ++{ ++ //SiMustAnyLock(sb); ++ return stosi(sb)->si_flags & flag; ++} ++ ++static inline unsigned int au_flag_test_udba(struct super_block *sb) ++{ ++ return au_flag_test(sb, AuMask_UDBA); ++} ++ ++static inline unsigned int au_flag_test_coo(struct super_block *sb) ++{ ++ return au_flag_test(sb, AuMask_COO); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* lock superblock. mainly for entry point functions */ ++/* ++ * si_read_lock, si_write_lock, ++ * si_read_unlock, si_write_unlock, si_downgrade_lock ++ */ ++SimpleRwsemFuncs(si, struct super_block *sb, stosi(sb)->si_rwsem); ++ ++/* to debug easier, do not make them inlined functions */ ++#define SiMustReadLock(sb) RwMustReadLock(&stosi(sb)->si_rwsem) ++#define SiMustWriteLock(sb) RwMustWriteLock(&stosi(sb)->si_rwsem) ++#define SiMustAnyLock(sb) RwMustAnyLock(&stosi(sb)->si_rwsem) ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_SUPER_H__ */ +diff --git a/fs/aufs/sysaufs.c b/fs/aufs/sysaufs.c +new file mode 100755 +index 0000000..d686862 +--- /dev/null ++++ b/fs/aufs/sysaufs.c +@@ -0,0 +1,620 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: sysaufs.c,v 1.6 2007/05/14 03:40:10 sfjro Exp $ */ ++ ++#include <linux/module.h> ++#include <linux/seq_file.h> ++#include <linux/sysfs.h> ++#include "aufs.h" ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* super_blocks list is not exported */ ++static DEFINE_MUTEX(aufs_sbilist_mtx); ++static LIST_HEAD(aufs_sbilist); ++ ++/* ---------------------------------------------------------------------- */ ++ ++typedef ssize_t (*rwfunc_t)(struct kobject *kobj, char *buf, loff_t offset, ++ size_t sz, struct sysaufs_args *args); ++static ssize_t sysaufs_read(struct kobject *kobj, char *buf, loff_t offset, ++ size_t sz, struct sysaufs_args *args); ++static ssize_t sysaufs_free_write(struct kobject *kobj, char *buf, loff_t ++ offset, size_t sz, struct sysaufs_args *args); ++ ++#define GFunc(name, _index, func) \ ++static ssize_t name(struct kobject *kobj, char *buf, loff_t offset, size_t sz) \ ++{ \ ++ struct sysaufs_args args = { \ ++ .index = (_index), \ ++ .mtx = &aufs_sbilist_mtx, \ ++ .sb = NULL \ ++ }; \ ++ return func(kobj, buf, offset, sz, &args); \ ++} ++ ++#define GFuncs(name, _index) \ ++ GFunc(read_##name, _index, sysaufs_read); \ ++ GFunc(write_##name, _index, sysaufs_free_write); ++ ++static struct super_block *find_sb_locked(struct kobject *kobj) ++{ ++ struct super_block *sb; ++ struct aufs_sbinfo *sbinfo; ++ ++ TraceEnter(); ++ MtxMustLock(&aufs_sbilist_mtx); ++ ++ sb = NULL; ++ list_for_each_entry(sbinfo, &aufs_sbilist, si_list) { ++ if (&au_subsys_to_kset(sbinfo->si_sysaufs.subsys).kobj != kobj) ++ continue; ++ sb = sbinfo->si_mnt->mnt_sb; ++ si_read_lock(sb); ++ break; ++ } ++ return sb; ++} ++ ++static ssize_t sb_func(struct kobject *kobj, char *buf, loff_t offset, ++ size_t sz, struct sysaufs_args *args, rwfunc_t func) ++{ ++ ssize_t err; ++ ++ err = -ENOENT; ++ mutex_lock(&aufs_sbilist_mtx); ++ args->sb = find_sb_locked(kobj); ++ if (args->sb) { ++ err = func(kobj, buf, offset, sz, args); ++ si_read_unlock(args->sb); ++ } ++ mutex_unlock(&aufs_sbilist_mtx); ++ return err; ++} ++ ++#define SbFunc(name, _index, func) \ ++static ssize_t name(struct kobject *kobj, char *buf, loff_t offset, size_t sz) \ ++{ \ ++ struct sysaufs_args args = { \ ++ .index = (_index), \ ++ .mtx = NULL \ ++ }; \ ++ return sb_func(kobj, buf, offset, sz, &args, func); \ ++} ++ ++#define SbFuncs(name, index) \ ++ SbFunc(read_##name, index, sysaufs_read); \ ++ SbFunc(write_##name, index, sysaufs_free_write) ++ ++static decl_subsys(aufs, NULL, NULL); ++enum {Brs, Stat, Config, _Last}; ++static struct sysaufs_entry g_array[_Last]; ++GFuncs(brs, Brs); ++GFuncs(stat, Stat); ++GFuncs(config, Config); ++ ++SbFuncs(xino, SysaufsSb_XINO); ++ ++#define SetEntry(e, _name, init_size, _ops) \ ++ do { \ ++ (e)->attr.attr.name = #_name; \ ++ (e)->attr.attr.owner = THIS_MODULE; \ ++ (e)->attr.attr.mode = S_IRUGO | S_IWUSR; \ ++ (e)->attr.read = read_##_name; \ ++ (e)->attr.write = write_##_name; \ ++ (e)->allocated = init_size; \ ++ (e)->err = -1; \ ++ (e)->ops = _ops; \ ++ } while (0) ++ ++#define Priv(e) (e)->attr.private ++#define Allocated(e) (e)->allocated ++#define Len(e) (e)->attr.size ++#define Name(e) attr_name((e)->attr) ++ ++/* ---------------------------------------------------------------------- */ ++ ++static void free_entry(struct sysaufs_entry *e) ++{ ++ MtxMustLock(&aufs_sbilist_mtx); ++ DEBUG_ON(!Priv(e)); ++ ++ if (Allocated(e) > 0) ++ kfree(Priv(e)); ++ else ++ free_pages((unsigned long)Priv(e), -Allocated(e)); ++ Priv(e) = NULL; ++ Len(e) = 0; ++} ++ ++static void free_entries(void) ++{ ++ static int a[] = {Brs, -1}; ++ int *p = a; ++ ++ MtxMustLock(&aufs_sbilist_mtx); ++ ++ while (*p >= 0) { ++ if (Priv(g_array + *p)) ++ free_entry(g_array + *p); ++ p++; ++ } ++} ++ ++static int alloc_entry(struct sysaufs_entry *e) ++{ ++ MtxMustLock(&aufs_sbilist_mtx); ++ DEBUG_ON(Priv(e)); ++ //Dbg("%d\n", Allocated(e)); ++ ++ if (Allocated(e) > 0) ++ Priv(e) = kmalloc(Allocated(e), GFP_KERNEL); ++ else ++ Priv(e) = (void*)__get_free_pages(GFP_KERNEL, -Allocated(e)); ++ if (Priv(e)) ++ return 0; ++ return -ENOMEM; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static void unreg(au_subsys_t *subsys, struct sysaufs_entry *a, int n, ++ au_subsys_t *parent) ++{ ++ int i; ++ ++ TraceEnter(); ++ ++ for (i = 0; i < n; i++, a++) ++ if (!a->err) { ++ sysfs_remove_bin_file ++ (&au_subsys_to_kset(*subsys).kobj, &a->attr); ++ if (Priv(a)) ++ free_entry(a); ++ } ++ ++ subsystem_unregister(subsys); ++ subsys_put(parent); ++} ++ ++static int reg(au_subsys_t *subsys, struct sysaufs_entry *a, int n, ++ au_subsys_t *parent) ++{ ++ int err, i; ++ ++ TraceEnter(); ++ ++ subsys_get(parent); ++ kobj_set_kset_s(&au_subsys_to_kset(*subsys), *parent); ++ err = subsystem_register(subsys); ++ if (unlikely(err)) ++ goto out; ++ ++ for (i = 0; !err && i < n; i++) ++ err = a[i].err = sysfs_create_bin_file ++ (&au_subsys_to_kset(*subsys).kobj, &a[i].attr); ++ if (unlikely(err)) ++ unreg(subsys, a, n, parent); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#define SbSetEntry(index, name, init_size) \ ++ SetEntry(sa->array + index, name, init_size, au_si_ops); ++ ++void sysaufs_add(struct aufs_sbinfo *sbinfo) ++{ ++ int err; ++ struct sysaufs_sbinfo *sa = &sbinfo->si_sysaufs; ++ ++ TraceEnter(); ++ ++ mutex_lock(&aufs_sbilist_mtx); ++ list_add_tail(&sbinfo->si_list, &aufs_sbilist); ++ free_entries(); ++ ++ memset(sa, 0, sizeof(*sa)); ++ SbSetEntry(SysaufsSb_XINO, xino, 128); ++ err = kobject_set_name(&au_subsys_to_kset(sa->subsys).kobj, "%p", ++ sbinfo->si_mnt->mnt_sb); ++ if (!err) ++ err = reg(&sa->subsys, sa->array, ARRAY_SIZE(sa->array), ++ &aufs_subsys); ++ if (unlikely(err)) ++ Warn("failed adding sysfs (%d)\n", err); ++ ++ mutex_unlock(&aufs_sbilist_mtx); ++} ++ ++void sysaufs_del(struct aufs_sbinfo *sbinfo) ++{ ++ struct sysaufs_sbinfo *sa = &sbinfo->si_sysaufs; ++ ++ TraceEnter(); ++ ++ mutex_lock(&aufs_sbilist_mtx); ++ unreg(&sa->subsys, sa->array, ARRAY_SIZE(sa->array), &aufs_subsys); ++ list_del(&sbinfo->si_list); ++ free_entries(); ++ mutex_unlock(&aufs_sbilist_mtx); ++} ++ ++void sysaufs_notify_remount(void) ++{ ++ mutex_lock(&aufs_sbilist_mtx); ++ free_entries(); ++ mutex_unlock(&aufs_sbilist_mtx); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int make_brs(struct seq_file *seq, struct sysaufs_args *args, ++ int *do_size) ++{ ++ int err; ++ struct aufs_sbinfo *sbinfo; ++ ++ TraceEnter(); ++ MtxMustLock(&aufs_sbilist_mtx); ++ DEBUG_ON(args->index != Brs); ++ ++ err = 0; ++ list_for_each_entry(sbinfo, &aufs_sbilist, si_list) { ++ struct super_block *sb; ++ struct dentry *root; ++ struct vfsmount *mnt; ++ ++ sb = sbinfo->si_mnt->mnt_sb; ++ root = sb->s_root; ++ aufs_read_lock(root, !AUFS_I_RLOCK); ++ mnt = sbinfo->si_mnt; ++ err = seq_escape ++ (seq, mnt->mnt_devname ? mnt->mnt_devname : "none", ++ au_esc_chars); ++ if (!err) ++ err = seq_putc(seq, ' '); ++ if (!err) ++ err = seq_path(seq, mnt, root, au_esc_chars); ++ if (err > 0) ++ err = seq_printf(seq, " %p br:", sb); ++ if (!err) ++ err = au_show_brs(seq, sb); ++ aufs_read_unlock(root, !AUFS_I_RLOCK); ++ if (!err) ++ err = seq_putc(seq, '\n'); ++ else ++ break; ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int make_config(struct seq_file *seq, struct sysaufs_args *args, ++ int *do_size) ++{ ++ int err; ++ ++ TraceEnter(); ++ DEBUG_ON(args->index != Config); ++ ++#ifdef CONFIG_AUFS ++ err = seq_puts(seq, "CONFIG_AUFS=y\n"); ++#else ++ err = seq_puts(seq, "CONFIG_AUFS=m\n"); ++#endif ++ ++#define puts(m, v) \ ++ if (!err) err = seq_puts(seq, "CONFIG_AUFS_" #m "=" #v "\n") ++#define puts_bool(m) puts(m, y) ++#define puts_mod(m) puts(m, m) ++ ++#ifdef CONFIG_AUFS_FAKE_DM ++ puts_bool(FAKE_DM); ++#endif ++#ifdef CONFIG_AUFS_BRANCH_MAX_127 ++ puts_bool(BRANCH_MAX_127); ++#elif defined(CONFIG_AUFS_BRANCH_MAX_511) ++ puts_bool(BRANCH_MAX_511); ++#elif defined(CONFIG_AUFS_BRANCH_MAX_1023) ++ puts_bool(BRANCH_MAX_1023); ++#elif defined(CONFIG_AUFS_BRANCH_MAX_32767) ++ puts_bool(BRANCH_MAX_32767); ++#endif ++ puts_bool(SYSAUFS); ++#ifdef CONFIG_AUFS_HINOTIFY ++ puts_bool(HINOTIFY); ++#endif ++#ifdef CONFIG_AUFS_EXPORT ++ puts_bool(EXPORT); ++#endif ++#ifdef CONFIG_AUFS_ROBR ++ puts_bool(ROBR); ++#endif ++#ifdef CONFIG_AUFS_DLGT ++ puts_bool(DLGT); ++#endif ++#ifdef CONFIG_AUFS_LHASH_PATCH ++ puts_bool(LHASH_PATCH); ++#endif ++#ifdef CONFIG_AUFS_KSIZE_PATCH ++ puts_bool(KSIZE_PATCH); ++#endif ++#ifdef CONFIG_AUFS_DEBUG ++ puts_bool(DEBUG); ++#endif ++#ifdef CONFIG_AUFS_COMPAT ++ puts_bool(COMPAT); ++#endif ++ ++#undef puts_bool ++#undef puts ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int make_stat(struct seq_file *seq, struct sysaufs_args *args, ++ int *do_size) ++{ ++ int err, i; ++ ++ TraceEnter(); ++ DEBUG_ON(args->index != Stat); ++ ++ *do_size = 0; ++ err = seq_puts(seq, "wkq max_busy:"); ++ for (i = 0; !err && i < aufs_nwkq; i++) ++ err = seq_printf(seq, " %u", au_wkq[i].max_busy); ++ if (!err) ++ err = seq_printf(seq, ", %u(generic)\n", ++ au_wkq[aufs_nwkq].max_busy); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static int make(struct sysaufs_entry *e, struct sysaufs_args *args, ++ int *do_size) ++ ++{ ++ int err; ++ struct seq_file *seq; ++ ++ TraceEnter(); ++ DEBUG_ON(Priv(e)); ++ MtxMustLock(&aufs_sbilist_mtx); ++ ++ err = -ENOMEM; ++ seq = kzalloc(sizeof(*seq), GFP_KERNEL); ++ if (unlikely(!seq)) ++ goto out; ++ ++ Len(e) = 0; ++ while (1) { ++ err = alloc_entry(e); ++ if (unlikely(err)) ++ break; ++ ++ //mutex_init(&seq.lock); ++ seq->buf = Priv(e); ++ seq->count = 0; ++ seq->size = Allocated(e); ++ if (unlikely(Allocated(e) <= 0)) ++ seq->size = PAGE_SIZE << -Allocated(e); ++ ++ err = e->ops[args->index](seq, args, do_size); ++ if (!err) { ++ Len(e) = seq->count; ++ break; /* success */ ++ } ++ ++ free_entry(e); ++ if (Allocated(e) > 0) { ++ Allocated(e) <<= 1; ++ if (unlikely(Allocated(e) >= (int)PAGE_SIZE)) ++ Allocated(e) = 0; ++ } else ++ Allocated(e)--; ++ //Dbg("%d\n", Allocated(e)); ++ } ++ kfree(seq); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* why does sysfs pass my parent kobject? */ ++static struct dentry *find_me(struct dentry *parent, struct sysaufs_entry *e) ++{ ++#if 1 ++ struct dentry *dentry; ++ const char *name = Name(e); ++ const unsigned int len = strlen(name); ++ ++ //Dbg("%.*s\n", DLNPair(parent)); ++ spin_lock(&dcache_lock); ++ list_for_each_entry(dentry, &parent->d_subdirs, D_CHILD) { ++ //Dbg("%.*s\n", DLNPair(dentry)); ++ if (len == dentry->d_name.len ++ && !strcmp(dentry->d_name.name, name)) { ++ spin_unlock(&dcache_lock); ++ return dentry; ++ } ++ } ++ spin_unlock(&dcache_lock); ++#endif ++ return NULL; ++} ++ ++static ssize_t sysaufs_read(struct kobject *kobj, char *buf, loff_t offset, ++ size_t sz, struct sysaufs_args *args) ++{ ++ ssize_t err; ++ loff_t len; ++ struct dentry *d; ++ struct sysaufs_entry *e; ++ int do_size; ++ ++ LKTRTrace("{%d, %p}, offset %Ld, sz %lu\n", ++ args->index, args->sb, offset, (unsigned long)sz); ++ ++ if (unlikely(!sz)) ++ return 0; ++ ++ err = 0; ++ d = NULL; ++ e = g_array + args->index; ++ if (args->sb) ++ e = stosi(args->sb)->si_sysaufs.array + args->index; ++ ++ do_size = 1; ++ if (args->mtx) ++ mutex_lock(args->mtx); ++ if (unlikely(!Priv(e))) { ++ err = make(e, args, &do_size); ++ DEBUG_ON(Len(e) > INT_MAX); ++ if (do_size) { ++ d = find_me(kobj->dentry, e); ++ if (d) ++ i_size_write(d->d_inode, Len(e)); ++ } ++ } ++ ++ if (!err) { ++ err = len = Len(e) - offset; ++ LKTRTrace("%Ld\n", len); ++ if (len > 0) { ++ if (len > sz) ++ err = sz; ++ memcpy(buf, Priv(e) + offset, err); ++ } ++ ++ if (!do_size) ++ free_entry(e); ++ } ++ if (args->mtx) ++ mutex_unlock(args->mtx); ++ ++ TraceErr(err); ++ return err; ++} ++ ++static ssize_t sysaufs_free_write(struct kobject *kobj, char *buf, ++ loff_t offset, size_t sz, ++ struct sysaufs_args *args) ++{ ++ struct dentry *d; ++ int allocated, len; ++ struct sysaufs_entry *e; ++ ++ LKTRTrace("{%d, %p}\n", args->index, args->sb); ++ ++ e = g_array + args->index; ++ if (args->sb) ++ e = stosi(args->sb)->si_sysaufs.array + args->index; ++ ++ if (args->mtx) ++ mutex_lock(args->mtx); ++ if (Priv(e)) { ++ allocated = Allocated(e); ++ if (unlikely(allocated <= 0)) ++ allocated = PAGE_SIZE << -allocated; ++ allocated >>= 1; ++ len = Len(e); ++ ++ free_entry(e); ++ if (unlikely(len <= allocated)) { ++ if (Allocated(e) >= 0) ++ Allocated(e) = allocated; ++ else ++ Allocated(e)++; ++ } ++ ++ d = find_me(kobj->dentry, e); ++ if (d && i_size_read(d->d_inode)) ++ i_size_write(d->d_inode, 0); ++ } ++ if (args->mtx) ++ mutex_unlock(args->mtx); ++ ++ return sz; ++} ++ ++static sysaufs_op g_ops[] = { ++ [Brs] = make_brs, ++ [Stat] = make_stat, ++ [Config] = make_config ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++#define GSetEntry(index, name, init_size) \ ++ SetEntry(g_array + index, name, init_size, g_ops) ++ ++int __init sysaufs_init(void) ++{ ++ int err; ++ ++ GSetEntry(Brs, brs, 128); ++ GSetEntry(Stat, stat, 32); ++ GSetEntry(Config, config, 256); ++ err = reg(&aufs_subsys, g_array, ARRAY_SIZE(g_array), &fs_subsys); ++ TraceErr(err); ++ return err; ++} ++ ++void __exit sysaufs_fin(void) ++{ ++ mutex_lock(&aufs_sbilist_mtx); ++ unreg(&aufs_subsys, g_array, ARRAY_SIZE(g_array), &fs_subsys); ++ mutex_unlock(&aufs_sbilist_mtx); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef DbgDlgt ++int is_branch(struct super_block *h_sb) ++{ ++ int found = 0; ++ struct aufs_sbinfo *sbinfo; ++ ++ //Dbg("here\n"); ++ mutex_lock(&aufs_sbilist_mtx); ++ list_for_each_entry(sbinfo, &aufs_sbilist, si_list) { ++ aufs_bindex_t bindex, bend; ++ struct super_block *sb; ++ ++ sb = sbinfo->si_mnt->mnt_sb; ++ si_read_lock(sb); ++ bend = sbend(sb); ++ for (bindex = 0; !found && bindex <= bend; bindex++) ++ found = (h_sb == sbr_sb(sb, bindex)); ++ si_read_unlock(sb); ++ } ++ mutex_unlock(&aufs_sbilist_mtx); ++ return found; ++} ++#endif +diff --git a/fs/aufs/sysaufs.h b/fs/aufs/sysaufs.h +new file mode 100755 +index 0000000..cf0247f +--- /dev/null ++++ b/fs/aufs/sysaufs.h +@@ -0,0 +1,83 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: sysaufs.h,v 1.3 2007/05/14 06:27:18 sfjro Exp $ */ ++ ++#ifndef __SYSAUFS_H__ ++#define __SYSAUFS_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/seq_file.h> ++#include <linux/sysfs.h> ++#include <linux/version.h> ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,22) ++typedef struct kset au_subsys_t; ++#define au_subsys_to_kset(subsys) (subsys) ++#else ++typedef struct subsystem au_subsys_t; ++#define au_subsys_to_kset(subsys) ((subsys).kset) ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* arguments for an entry under sysfs */ ++struct sysaufs_args { ++ int index; ++ struct mutex *mtx; ++ struct super_block *sb; ++}; ++ ++typedef int (*sysaufs_op)(struct seq_file *seq, struct sysaufs_args *args, ++ int *do_size); ++ ++/* an entry under sysfs */ ++struct sysaufs_entry { ++ struct bin_attribute attr; ++ int allocated; /* zero minus means pages */ ++ int err; ++ sysaufs_op *ops; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct aufs_sbinfo; ++#ifdef CONFIG_AUFS_SYSAUFS ++void sysaufs_add(struct aufs_sbinfo *sbinfo); ++void sysaufs_del(struct aufs_sbinfo *sbinfo); ++int __init sysaufs_init(void); ++void sysaufs_fin(void); ++void sysaufs_notify_remount(void); ++#else ++static inline void sysaufs_add(struct aufs_sbinfo *sbinfo) ++{ ++ /* nothing */ ++} ++ ++static inline void sysaufs_del(struct aufs_sbinfo *sbinfo) ++{ ++ /* nothing */ ++} ++#define sysaufs_init() 0 ++#define sysaufs_fin() /* */ ++#define sysaufs_notify_remount() /* */ ++#endif /* CONFIG_AUFS_SYSAUFS */ ++ ++#endif /* __KERNEL__ */ ++#endif /* __SYSAUFS_H__ */ +diff --git a/fs/aufs/vdir.c b/fs/aufs/vdir.c +new file mode 100755 +index 0000000..8e99b7d +--- /dev/null ++++ b/fs/aufs/vdir.c +@@ -0,0 +1,802 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: vdir.c,v 1.22 2007/05/14 03:38:52 sfjro Exp $ */ ++ ++#include "aufs.h" ++ ++static int calc_size(int namelen) ++{ ++ int sz; ++ ++ sz = sizeof(struct aufs_de) + namelen; ++ if (sizeof(ino_t) == sizeof(long)) { ++ const int mask = sizeof(ino_t) - 1; ++ if (sz & mask) { ++ sz += sizeof(ino_t); ++ sz &= ~mask; ++ } ++ } else { ++#if 0 // remove ++ BUG(); ++ // this block will be discarded by optimizer. ++ int m; ++ m = sz % sizeof(ino_t); ++ if (m) ++ sz += sizeof(ino_t) - m; ++#endif ++ } ++ ++ DEBUG_ON(sz % sizeof(ino_t)); ++ return sz; ++} ++ ++static int set_deblk_end(union aufs_deblk_p *p, union aufs_deblk_p *deblk_end) ++{ ++ if (calc_size(0) <= deblk_end->p - p->p) { ++ p->de->de_str.len = 0; ++ //smp_mb(); ++ return 0; ++ } ++ return -1; // error ++} ++ ++/* returns true or false */ ++static int is_deblk_end(union aufs_deblk_p *p, union aufs_deblk_p *deblk_end) ++{ ++ if (calc_size(0) <= deblk_end->p - p->p) ++ return !p->de->de_str.len; ++ return 1; ++} ++ ++static aufs_deblk_t *last_deblk(struct aufs_vdir *vdir) ++{ ++ return vdir->vd_deblk[vdir->vd_nblk - 1]; ++} ++ ++void nhash_init(struct aufs_nhash *nhash) ++{ ++ int i; ++ for (i = 0; i < AUFS_NHASH_SIZE; i++) ++ INIT_HLIST_HEAD(nhash->heads + i); ++} ++ ++struct aufs_nhash *nhash_new(gfp_t gfp) ++{ ++ struct aufs_nhash *nhash; ++ ++ nhash = kmalloc(sizeof(*nhash), gfp); ++ if (nhash) { ++ nhash_init(nhash); ++ return nhash; ++ } ++ return ERR_PTR(-ENOMEM); ++} ++ ++void nhash_del(struct aufs_nhash *nhash) ++{ ++ nhash_fin(nhash); ++ kfree(nhash); ++} ++ ++void nhash_move(struct aufs_nhash *dst, struct aufs_nhash *src) ++{ ++ int i; ++ ++ TraceEnter(); ++ ++ //DbgWhlist(src); ++ *dst = *src; ++ for (i = 0; i < AUFS_NHASH_SIZE; i++) { ++ struct hlist_head *h; ++ h = dst->heads + i; ++ if (h->first) ++ h->first->pprev = &h->first; ++ INIT_HLIST_HEAD(src->heads + i); ++ } ++ //DbgWhlist(src); ++ //DbgWhlist(dst); ++ //smp_mb(); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++void nhash_fin(struct aufs_nhash *whlist) ++{ ++ int i; ++ struct hlist_head *head; ++ struct aufs_wh *tpos; ++ struct hlist_node *pos, *n; ++ ++ TraceEnter(); ++ ++ for (i = 0; i < AUFS_NHASH_SIZE; i++) { ++ head = whlist->heads + i; ++ hlist_for_each_entry_safe(tpos, pos, n, head, wh_hash) { ++ //hlist_del(pos); ++ kfree(tpos); ++ } ++ } ++} ++ ++int is_longer_wh(struct aufs_nhash *whlist, aufs_bindex_t btgt, int limit) ++{ ++ int n, i; ++ struct hlist_head *head; ++ struct aufs_wh *tpos; ++ struct hlist_node *pos; ++ ++ LKTRTrace("limit %d\n", limit); ++ //return 1; ++ ++ n = 0; ++ for (i = 0; i < AUFS_NHASH_SIZE; i++) { ++ head = whlist->heads + i; ++ hlist_for_each_entry(tpos, pos, head, wh_hash) ++ if (tpos->wh_bindex == btgt && ++n > limit) ++ return 1; ++ } ++ return 0; ++} ++ ++/* returns found(true) or not */ ++int test_known_wh(struct aufs_nhash *whlist, char *name, int namelen) ++{ ++ struct hlist_head *head; ++ struct aufs_wh *tpos; ++ struct hlist_node *pos; ++ struct aufs_destr *str; ++ ++ LKTRTrace("%.*s\n", namelen, name); ++ ++ head = whlist->heads + au_name_hash(name, namelen); ++ hlist_for_each_entry(tpos, pos, head, wh_hash) { ++ str = &tpos->wh_str; ++ LKTRTrace("%.*s\n", str->len, str->name); ++ if (str->len == namelen && !memcmp(str->name, name, namelen)) ++ return 1; ++ } ++ return 0; ++} ++ ++int append_wh(struct aufs_nhash *whlist, char *name, int namelen, ++ aufs_bindex_t bindex) ++{ ++ int err; ++ struct aufs_destr *str; ++ struct aufs_wh *wh; ++ ++ LKTRTrace("%.*s\n", namelen, name); ++ ++ err = -ENOMEM; ++ wh = kmalloc(sizeof(*wh) + namelen, GFP_KERNEL); ++ if (unlikely(!wh)) ++ goto out; ++ err = 0; ++ wh->wh_bindex = bindex; ++ str = &wh->wh_str; ++ str->len = namelen; ++ memcpy(str->name, name, namelen); ++ hlist_add_head(&wh->wh_hash, ++ whlist->heads + au_name_hash(name, namelen)); ++ //smp_mb(); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++void free_vdir(struct aufs_vdir *vdir) ++{ ++ aufs_deblk_t **deblk; ++ ++ TraceEnter(); ++ ++ deblk = vdir->vd_deblk; ++ while (vdir->vd_nblk--) { ++ kfree(*deblk); ++ deblk++; ++ } ++ kfree(vdir->vd_deblk); ++ cache_free_vdir(vdir); ++} ++ ++static int append_deblk(struct aufs_vdir *vdir) ++{ ++ int err, sz, i; ++ aufs_deblk_t **o; ++ union aufs_deblk_p p, deblk_end; ++ ++ TraceEnter(); ++ ++ err = -ENOMEM; ++ sz = sizeof(*o) * vdir->vd_nblk; ++ o = au_kzrealloc(vdir->vd_deblk, sz, sz + sizeof(*o), GFP_KERNEL); ++ if (unlikely(!o)) ++ goto out; ++ vdir->vd_deblk = o; ++ p.deblk = kmalloc(sizeof(*p.deblk), GFP_KERNEL); ++ if (p.deblk) { ++ i = vdir->vd_nblk++; ++ vdir->vd_deblk[i] = p.deblk; ++ vdir->vd_last.i = i; ++ vdir->vd_last.p.p = p.p; ++ deblk_end.deblk = p.deblk + 1; ++ err = set_deblk_end(&p, &deblk_end); ++ DEBUG_ON(err); ++ } ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static struct aufs_vdir *alloc_vdir(void) ++{ ++ struct aufs_vdir *vdir; ++ int err; ++ ++ TraceEnter(); ++ ++ err = -ENOMEM; ++ vdir = cache_alloc_vdir(); ++ if (unlikely(!vdir)) ++ goto out; ++ vdir->vd_deblk = kzalloc(sizeof(*vdir->vd_deblk), GFP_KERNEL); ++ if (unlikely(!vdir->vd_deblk)) ++ goto out_free; ++ ++ vdir->vd_nblk = 0; ++ vdir->vd_version = 0; ++ vdir->vd_jiffy = 0; ++ err = append_deblk(vdir); ++ if (!err) ++ return vdir; /* success */ ++ ++ kfree(vdir->vd_deblk); ++ ++ out_free: ++ cache_free_vdir(vdir); ++ out: ++ vdir = ERR_PTR(err); ++ TraceErrPtr(vdir); ++ return vdir; ++} ++ ++static int reinit_vdir(struct aufs_vdir *vdir) ++{ ++ int err; ++ union aufs_deblk_p p, deblk_end; ++ ++ TraceEnter(); ++ ++ while (vdir->vd_nblk > 1) { ++ kfree(vdir->vd_deblk[vdir->vd_nblk - 1]); ++ vdir->vd_deblk[vdir->vd_nblk - 1] = NULL; ++ vdir->vd_nblk--; ++ } ++ p.deblk = vdir->vd_deblk[0]; ++ deblk_end.deblk = p.deblk + 1; ++ err = set_deblk_end(&p, &deblk_end); ++ DEBUG_ON(err); ++ vdir->vd_version = 0; ++ vdir->vd_jiffy = 0; ++ vdir->vd_last.i = 0; ++ vdir->vd_last.p.deblk = vdir->vd_deblk[0]; ++ //smp_mb(); ++ //DbgVdir(vdir); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static void free_dehlist(struct aufs_nhash *dehlist) ++{ ++ int i; ++ struct hlist_head *head; ++ struct aufs_dehstr *tpos; ++ struct hlist_node *pos, *n; ++ ++ TraceEnter(); ++ ++ for (i = 0; i < AUFS_NHASH_SIZE; i++) { ++ head = dehlist->heads + i; ++ hlist_for_each_entry_safe(tpos, pos, n, head, hash) { ++ //hlist_del(pos); ++ cache_free_dehstr(tpos); ++ } ++ } ++} ++ ++/* returns found(true) or not */ ++static int test_known(struct aufs_nhash *delist, char *name, int namelen) ++{ ++ struct hlist_head *head; ++ struct aufs_dehstr *tpos; ++ struct hlist_node *pos; ++ struct aufs_destr *str; ++ ++ LKTRTrace("%.*s\n", namelen, name); ++ ++ head = delist->heads + au_name_hash(name, namelen); ++ hlist_for_each_entry(tpos, pos, head, hash) { ++ str = tpos->str; ++ LKTRTrace("%.*s\n", str->len, str->name); ++ if (str->len == namelen && !memcmp(str->name, name, namelen)) ++ return 1; ++ } ++ return 0; ++ ++} ++ ++static int append_de(struct aufs_vdir *vdir, char *name, int namelen, ino_t ino, ++ unsigned int d_type, struct aufs_nhash *delist) ++{ ++ int err, sz; ++ union aufs_deblk_p p, *room, deblk_end; ++ struct aufs_dehstr *dehstr; ++ ++ LKTRTrace("%.*s %d, i%lu, dt%u\n", namelen, name, namelen, ino, d_type); ++ ++ p.deblk = last_deblk(vdir); ++ deblk_end.deblk = p.deblk + 1; ++ room = &vdir->vd_last.p; ++ DEBUG_ON(room->p < p.p || deblk_end.p <= room->p ++ || !is_deblk_end(room, &deblk_end)); ++ ++ sz = calc_size(namelen); ++ if (unlikely(sz > deblk_end.p - room->p)) { ++ err = append_deblk(vdir); ++ if (unlikely(err)) ++ goto out; ++ p.deblk = last_deblk(vdir); ++ deblk_end.deblk = p.deblk + 1; ++ //smp_mb(); ++ DEBUG_ON(room->p != p.p); ++ } ++ ++ err = -ENOMEM; ++ dehstr = cache_alloc_dehstr(); ++ if (unlikely(!dehstr)) ++ goto out; ++ dehstr->str = &room->de->de_str; ++ hlist_add_head(&dehstr->hash, ++ delist->heads + au_name_hash(name, namelen)); ++ ++ room->de->de_ino = ino; ++ room->de->de_type = d_type; ++ room->de->de_str.len = namelen; ++ memcpy(room->de->de_str.name, name, namelen); ++ ++ err = 0; ++ room->p += sz; ++ if (unlikely(set_deblk_end(room, &deblk_end))) ++ err = append_deblk(vdir); ++ //smp_mb(); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct fillvdir_arg { ++ struct file *file; ++ struct aufs_vdir *vdir; ++ struct aufs_nhash *delist; ++ struct aufs_nhash *whlist; ++ aufs_bindex_t bindex; ++ int err; ++ int called; ++}; ++ ++static int fillvdir(void *__arg, const char *__name, int namelen, loff_t offset, ++ filldir_ino_t h_ino, unsigned int d_type) ++{ ++ struct fillvdir_arg *arg = __arg; ++ char *name = (void*)__name; ++ aufs_bindex_t bindex, bend; ++ struct xino xino; ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s, namelen %d, i%Lu, dt%u\n", ++ namelen, name, namelen, (u64)h_ino, d_type); ++ ++ sb = arg->file->f_dentry->d_sb; ++ bend = arg->bindex; ++ arg->err = 0; ++ arg->called++; ++ //smp_mb(); ++ if (namelen <= AUFS_WH_PFX_LEN ++ || memcmp(name, AUFS_WH_PFX, AUFS_WH_PFX_LEN)) { ++ for (bindex = 0; bindex < bend; bindex++) ++ if (test_known(arg->delist + bindex, name, namelen) ++ || test_known_wh(arg->whlist + bindex, name, ++ namelen)) ++ goto out; /* already exists or whiteouted */ ++ ++ arg->err = xino_read(sb, bend, h_ino, &xino); ++ if (!arg->err && !xino.ino) { ++ //struct inode *h_inode; ++ xino.ino = xino_new_ino(sb); ++ if (unlikely(!xino.ino)) ++ arg->err = -EIO; ++#if 0 ++ //xino.h_gen = AuXino_INVALID_HGEN; ++ h_inode = ilookup(sbr_sb(sb, bend), h_ino); ++ if (h_inode) { ++ if (!is_bad_inode(h_inode)) { ++ xino.h_gen = h_inode->i_generation; ++ WARN_ON(xino.h_gen == AuXino_INVALID_HGEN); ++ } ++ iput(h_inode); ++ } ++#endif ++ arg->err = xino_write(sb, bend, h_ino, &xino); ++ } ++ if (!arg->err) ++ arg->err = append_de(arg->vdir, name, namelen, xino.ino, ++ d_type, arg->delist + bend); ++ } else { ++ name += AUFS_WH_PFX_LEN; ++ namelen -= AUFS_WH_PFX_LEN; ++ for (bindex = 0; bindex < bend; bindex++) ++ if (test_known_wh(arg->whlist + bend, name, namelen)) ++ goto out; /* already whiteouted */ ++ arg->err = append_wh(arg->whlist + bend, name, namelen, bend); ++ } ++ ++ out: ++ if (!arg->err) ++ arg->vdir->vd_jiffy = jiffies; ++ //smp_mb(); ++ TraceErr(arg->err); ++ return arg->err; ++} ++ ++static int read_vdir(struct file *file, int may_read) ++{ ++ int err, do_read, dlgt; ++ struct dentry *dentry; ++ struct inode *inode; ++ struct aufs_vdir *vdir, *allocated; ++ unsigned long expire; ++ struct fillvdir_arg arg; ++ aufs_bindex_t bindex, bend, bstart; ++ struct super_block *sb; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, may %d\n", DLNPair(dentry), may_read); ++ FiMustWriteLock(file); ++ inode = dentry->d_inode; ++ IMustLock(inode); ++ IiMustWriteLock(inode); ++ DEBUG_ON(!S_ISDIR(inode->i_mode)); ++ ++ err = 0; ++ allocated = NULL; ++ do_read = 0; ++ sb = inode->i_sb; ++ expire = stosi(sb)->si_rdcache; ++ vdir = ivdir(inode); ++ if (!vdir) { ++ DEBUG_ON(fvdir_cache(file)); ++ do_read = 1; ++ vdir = alloc_vdir(); ++ err = PTR_ERR(vdir); ++ if (IS_ERR(vdir)) ++ goto out; ++ err = 0; ++ allocated = vdir; ++ } else if (may_read ++ && (inode->i_version != vdir->vd_version ++ || time_after(jiffies, vdir->vd_jiffy + expire))) { ++ LKTRTrace("iver %lu, vdver %lu, exp %lu\n", ++ inode->i_version, vdir->vd_version, ++ vdir->vd_jiffy + expire); ++ do_read = 1; ++ err = reinit_vdir(vdir); ++ if (unlikely(err)) ++ goto out; ++ } ++ //DbgVdir(vdir); goto out; ++ ++ if (!do_read) ++ return 0; /* success */ ++ ++ err = -ENOMEM; ++ bend = fbend(file); ++ arg.delist = kmalloc(sizeof(*arg.delist) * (bend + 1), GFP_KERNEL); ++ if (unlikely(!arg.delist)) ++ goto out_vdir; ++ arg.whlist = kmalloc(sizeof(*arg.whlist) * (bend + 1), GFP_KERNEL); ++ if (unlikely(!arg.whlist)) ++ goto out_delist; ++ err = 0; ++ for (bindex = 0; bindex <= bend; bindex++) { ++ nhash_init(arg.delist + bindex); ++ nhash_init(arg.whlist + bindex); ++ } ++ ++ dlgt = need_dlgt(sb); ++ arg.file = file; ++ arg.vdir = vdir; ++ bstart = fbstart(file); ++ for (bindex = bstart; !err && bindex <= bend; bindex++) { ++ struct file *hf; ++ struct inode *h_inode; ++ ++ hf = au_h_fptr_i(file, bindex); ++ if (!hf) ++ continue; ++ ++ h_inode = hf->f_dentry->d_inode; ++ //hf->f_pos = 0; ++ arg.bindex = bindex; ++ do { ++ arg.err = 0; ++ arg.called = 0; ++ //smp_mb(); ++ err = vfsub_readdir(hf, fillvdir, &arg, dlgt); ++ if (err >= 0) ++ err = arg.err; ++ } while (!err && arg.called); ++ } ++ ++ for (bindex = bstart; bindex <= bend; bindex++) { ++ free_dehlist(arg.delist + bindex); ++ nhash_fin(arg.whlist + bindex); ++ } ++ kfree(arg.whlist); ++ ++ out_delist: ++ kfree(arg.delist); ++ out_vdir: ++ if (!err) { ++ //file->f_pos = 0; ++ vdir->vd_version = inode->i_version; ++ vdir->vd_last.i = 0; ++ vdir->vd_last.p.deblk = vdir->vd_deblk[0]; ++ if (allocated) ++ set_ivdir(inode, allocated); ++ } else if (allocated) ++ free_vdir(allocated); ++ //DbgVdir(vdir); goto out; ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static int copy_vdir(struct aufs_vdir *tgt, struct aufs_vdir *src) ++{ ++ int err, i, rerr, n; ++ ++ TraceEnter(); ++ DEBUG_ON(tgt->vd_nblk != 1); ++ //DbgVdir(tgt); ++ ++ err = -ENOMEM; ++ if (tgt->vd_nblk < src->vd_nblk) { ++ aufs_deblk_t **p; ++ p = au_kzrealloc(tgt->vd_deblk, sizeof(*p) * tgt->vd_nblk, ++ sizeof(*p) * src->vd_nblk, GFP_KERNEL); ++ if (unlikely(!p)) ++ goto out; ++ tgt->vd_deblk = p; ++ } ++ ++ n = tgt->vd_nblk = src->vd_nblk; ++ memcpy(tgt->vd_deblk[0], src->vd_deblk[0], AUFS_DEBLK_SIZE); ++ //tgt->vd_last.i = 0; ++ //tgt->vd_last.p.deblk = tgt->vd_deblk[0]; ++ tgt->vd_version = src->vd_version; ++ tgt->vd_jiffy = src->vd_jiffy; ++ ++ for (i = 1; i < n; i++) { ++ tgt->vd_deblk[i] = kmalloc(AUFS_DEBLK_SIZE, GFP_KERNEL); ++ if (tgt->vd_deblk[i]) ++ memcpy(tgt->vd_deblk[i], src->vd_deblk[i], ++ AUFS_DEBLK_SIZE); ++ else ++ goto out; ++ } ++ //smp_mb(); ++ //DbgVdir(tgt); ++ return 0; /* success */ ++ ++ out: ++ rerr = reinit_vdir(tgt); ++ BUG_ON(rerr); ++ TraceErr(err); ++ return err; ++} ++ ++int au_init_vdir(struct file *file) ++{ ++ int err; ++ struct dentry *dentry; ++ struct inode *inode; ++ struct aufs_vdir *vdir_cache, *allocated; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, pos %Ld\n", DLNPair(dentry), file->f_pos); ++ FiMustWriteLock(file); ++ inode = dentry->d_inode; ++ IiMustWriteLock(inode); ++ DEBUG_ON(!S_ISDIR(inode->i_mode)); ++ ++ err = read_vdir(file, !file->f_pos); ++ if (unlikely(err)) ++ goto out; ++ //DbgVdir(ivdir(inode)); goto out; ++ ++ allocated = NULL; ++ vdir_cache = fvdir_cache(file); ++ if (!vdir_cache) { ++ vdir_cache = alloc_vdir(); ++ err = PTR_ERR(vdir_cache); ++ if (IS_ERR(vdir_cache)) ++ goto out; ++ allocated = vdir_cache; ++ } else if (!file->f_pos && vdir_cache->vd_version != file->f_version) { ++ err = reinit_vdir(vdir_cache); ++ if (unlikely(err)) ++ goto out; ++ } else ++ return 0; /* success */ ++ //err = 0; DbgVdir(vdir_cache); goto out; ++ ++ err = copy_vdir(vdir_cache, ivdir(inode)); ++ if (!err) { ++ file->f_version = inode->i_version; ++ if (allocated) ++ set_fvdir_cache(file, allocated); ++ } else if (allocated) ++ free_vdir(allocated); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++static loff_t calc_offset(struct aufs_vdir *vdir) ++{ ++ loff_t offset; ++ union aufs_deblk_p p; ++ ++ p.deblk = vdir->vd_deblk[vdir->vd_last.i]; ++ offset = vdir->vd_last.p.p - p.p; ++ offset += sizeof(*p.deblk) * vdir->vd_last.i; ++ return offset; ++} ++ ++/* returns true or false */ ++static int seek_vdir(struct file *file) ++{ ++ int valid, i, n; ++ struct dentry *dentry; ++ struct aufs_vdir *vdir_cache; ++ loff_t offset; ++ union aufs_deblk_p p, deblk_end; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, pos %Ld\n", DLNPair(dentry), file->f_pos); ++ vdir_cache = fvdir_cache(file); ++ DEBUG_ON(!vdir_cache); ++ //DbgVdir(vdir_cache); ++ ++ valid = 1; ++ offset = calc_offset(vdir_cache); ++ LKTRTrace("offset %Ld\n", offset); ++ if (file->f_pos == offset) ++ goto out; ++ ++ vdir_cache->vd_last.i = 0; ++ vdir_cache->vd_last.p.deblk = vdir_cache->vd_deblk[0]; ++ if (!file->f_pos) ++ goto out; ++ ++ valid = 0; ++ i = file->f_pos / AUFS_DEBLK_SIZE; ++ LKTRTrace("i %d\n", i); ++ if (i >= vdir_cache->vd_nblk) ++ goto out; ++ ++ n = vdir_cache->vd_nblk; ++ //DbgVdir(vdir_cache); ++ for (; i < n; i++) { ++ p.deblk = vdir_cache->vd_deblk[i]; ++ deblk_end.deblk = p.deblk + 1; ++ offset = i * AUFS_DEBLK_SIZE; ++ while (!is_deblk_end(&p, &deblk_end) && offset < file->f_pos) { ++ int l; ++ l = calc_size(p.de->de_str.len); ++ offset += l; ++ p.p += l; ++ } ++ if (!is_deblk_end(&p, &deblk_end)) { ++ valid = 1; ++ vdir_cache->vd_last.i = i; ++ vdir_cache->vd_last.p = p; ++ break; ++ } ++ } ++ ++ out: ++ //smp_mb(); ++ //DbgVdir(vdir_cache); ++ TraceErr(!valid); ++ return valid; ++} ++ ++int au_fill_de(struct file *file, void *dirent, filldir_t filldir) ++{ ++ int err, l; ++ struct dentry *dentry; ++ struct aufs_vdir *vdir_cache; ++ struct aufs_de *de; ++ union aufs_deblk_p deblk_end; ++ ++ dentry = file->f_dentry; ++ LKTRTrace("%.*s, pos %Ld\n", DLNPair(dentry), file->f_pos); ++ vdir_cache = fvdir_cache(file); ++ DEBUG_ON(!vdir_cache); ++ //DbgVdir(vdir_cache); ++ ++ if (!seek_vdir(file)) ++ return 0; ++ ++ while (1) { ++ deblk_end.deblk ++ = vdir_cache->vd_deblk[vdir_cache->vd_last.i] + 1; ++ while (!is_deblk_end(&vdir_cache->vd_last.p, &deblk_end)) { ++ de = vdir_cache->vd_last.p.de; ++ LKTRTrace("%.*s, off%Ld, i%lu, dt%d\n", ++ de->de_str.len, de->de_str.name, ++ file->f_pos, de->de_ino, de->de_type); ++ err = filldir(dirent, de->de_str.name, de->de_str.len, ++ file->f_pos, de->de_ino, de->de_type); ++ if (unlikely(err)) { ++ TraceErr(err); ++ //return err; ++ //todo: ignore the error caused by udba. ++ return 0; ++ } ++ ++ l = calc_size(de->de_str.len); ++ vdir_cache->vd_last.p.p += l; ++ file->f_pos += l; ++ } ++ if (vdir_cache->vd_last.i < vdir_cache->vd_nblk - 1) { ++ vdir_cache->vd_last.i++; ++ vdir_cache->vd_last.p.deblk ++ = vdir_cache->vd_deblk[vdir_cache->vd_last.i]; ++ file->f_pos = sizeof(*vdir_cache->vd_last.p.deblk) ++ * vdir_cache->vd_last.i; ++ continue; ++ } ++ break; ++ } ++ ++ //smp_mb(); ++ return 0; ++} +diff --git a/fs/aufs/vfsub.c b/fs/aufs/vfsub.c +new file mode 100755 +index 0000000..8571d21 +--- /dev/null ++++ b/fs/aufs/vfsub.c +@@ -0,0 +1,665 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: vfsub.c,v 1.5 2007/04/23 00:55:06 sfjro Exp $ */ ++// I'm going to slightly mad ++ ++#include "aufs.h" ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_DLGT ++struct permission_args { ++ int *errp; ++ struct inode *inode; ++ int mask; ++ struct nameidata *nd; ++}; ++ ++static void call_permission(void *args) ++{ ++ struct permission_args *a = args; ++ *a->errp = do_vfsub_permission(a->inode, a->mask, a->nd); ++} ++ ++int vfsub_permission(struct inode *inode, int mask, struct nameidata *nd, ++ int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_permission(inode, mask, nd); ++ else { ++ int err; ++ struct permission_args args = { ++ .errp = &err, ++ .inode = inode, ++ .mask = mask, ++ .nd = nd ++ }; ++ au_wkq_wait(call_permission, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct create_args { ++ int *errp; ++ struct inode *dir; ++ struct dentry *dentry; ++ int mode; ++ struct nameidata *nd; ++}; ++ ++static void call_create(void *args) ++{ ++ struct create_args *a = args; ++ *a->errp = do_vfsub_create(a->dir, a->dentry, a->mode, a->nd); ++} ++ ++int vfsub_create(struct inode *dir, struct dentry *dentry, int mode, ++ struct nameidata *nd, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_create(dir, dentry, mode, nd); ++ else { ++ int err; ++ struct create_args args = { ++ .errp = &err, ++ .dir = dir, ++ .dentry = dentry, ++ .mode = mode, ++ .nd = nd ++ }; ++ au_wkq_wait(call_create, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++struct symlink_args { ++ int *errp; ++ struct inode *dir; ++ struct dentry *dentry; ++ const char *symname; ++ int mode; ++}; ++ ++static void call_symlink(void *args) ++{ ++ struct symlink_args *a = args; ++ *a->errp = do_vfsub_symlink(a->dir, a->dentry, a->symname, a->mode); ++} ++ ++int vfsub_symlink(struct inode *dir, struct dentry *dentry, const char *symname, ++ int mode, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_symlink(dir, dentry, symname, mode); ++ else { ++ int err; ++ struct symlink_args args = { ++ .errp = &err, ++ .dir = dir, ++ .dentry = dentry, ++ .symname = symname, ++ .mode = mode ++ }; ++ au_wkq_wait(call_symlink, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++struct mknod_args { ++ int *errp; ++ struct inode *dir; ++ struct dentry *dentry; ++ int mode; ++ dev_t dev; ++}; ++ ++static void call_mknod(void *args) ++{ ++ struct mknod_args *a = args; ++ *a->errp = do_vfsub_mknod(a->dir, a->dentry, a->mode, a->dev); ++} ++ ++int vfsub_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev, ++ int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_mknod(dir, dentry, mode, dev); ++ else { ++ int err; ++ struct mknod_args args = { ++ .errp = &err, ++ .dir = dir, ++ .dentry = dentry, ++ .mode = mode, ++ .dev = dev ++ }; ++ au_wkq_wait(call_mknod, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++struct mkdir_args { ++ int *errp; ++ struct inode *dir; ++ struct dentry *dentry; ++ int mode; ++}; ++ ++static void call_mkdir(void *args) ++{ ++ struct mkdir_args *a = args; ++ *a->errp = do_vfsub_mkdir(a->dir, a->dentry, a->mode); ++} ++ ++int vfsub_mkdir(struct inode *dir, struct dentry *dentry, int mode, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_mkdir(dir, dentry, mode); ++ else { ++ int err; ++ struct mkdir_args args = { ++ .errp = &err, ++ .dir = dir, ++ .dentry = dentry, ++ .mode = mode ++ }; ++ au_wkq_wait(call_mkdir, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct link_args { ++ int *errp; ++ struct inode *dir; ++ struct dentry *src_dentry, *dentry; ++}; ++ ++static void call_link(void *args) ++{ ++ struct link_args *a = args; ++ *a->errp = do_vfsub_link(a->src_dentry, a->dir, a->dentry); ++} ++ ++int vfsub_link(struct dentry *src_dentry, struct inode *dir, ++ struct dentry *dentry, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_link(src_dentry, dir, dentry); ++ else { ++ int err; ++ struct link_args args = { ++ .errp = &err, ++ .src_dentry = src_dentry, ++ .dir = dir, ++ .dentry = dentry ++ }; ++ au_wkq_wait(call_link, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++struct rename_args { ++ int *errp; ++ struct inode *src_dir, *dir; ++ struct dentry *src_dentry, *dentry; ++}; ++ ++static void call_rename(void *args) ++{ ++ struct rename_args *a = args; ++ *a->errp = do_vfsub_rename(a->src_dir, a->src_dentry, a->dir, ++ a->dentry); ++} ++ ++int vfsub_rename(struct inode *src_dir, struct dentry *src_dentry, ++ struct inode *dir, struct dentry *dentry, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_rename(src_dir, src_dentry, dir, dentry); ++ else { ++ int err; ++ struct rename_args args = { ++ .errp = &err, ++ .src_dir = src_dir, ++ .src_dentry = src_dentry, ++ .dir = dir, ++ .dentry = dentry ++ }; ++ au_wkq_wait(call_rename, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++struct rmdir_args { ++ int *errp; ++ struct inode *dir; ++ struct dentry *dentry; ++}; ++ ++static void call_rmdir(void *args) ++{ ++ struct rmdir_args *a = args; ++ *a->errp = do_vfsub_rmdir(a->dir, a->dentry); ++} ++ ++int vfsub_rmdir(struct inode *dir, struct dentry *dentry, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_rmdir(dir, dentry); ++ else { ++ int err; ++ struct rmdir_args args = { ++ .errp = &err, ++ .dir = dir, ++ .dentry = dentry ++ }; ++ au_wkq_wait(call_rmdir, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct read_args { ++ ssize_t *errp; ++ struct file *file; ++ union { ++ void *kbuf; ++ char __user *ubuf; ++ }; ++ size_t count; ++ loff_t *ppos; ++}; ++ ++static void call_read_k(void *args) ++{ ++ struct read_args *a = args; ++ LKTRTrace("%.*s, cnt %lu, pos %Ld\n", ++ DLNPair(a->file->f_dentry), (unsigned long)a->count, ++ *a->ppos); ++ *a->errp = do_vfsub_read_k(a->file, a->kbuf, a->count, a->ppos); ++} ++ ++ssize_t vfsub_read_u(struct file *file, char __user *ubuf, size_t count, ++ loff_t *ppos, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_read_u(file, ubuf, count, ppos); ++ else { ++ ssize_t err, read; ++ struct read_args args = { ++ .errp = &err, ++ .file = file, ++ .count = count, ++ .ppos = ppos ++ }; ++ ++ if (unlikely(!count)) ++ return 0; ++ ++ /* ++ * workaround an application bug. ++ * generally, read(2) or write(2) may return the value shorter ++ * than requested. But many applications don't support it, ++ * for example bash. ++ */ ++ err = -ENOMEM; ++ if (args.count > PAGE_SIZE) ++ args.count = PAGE_SIZE; ++ args.kbuf = kmalloc(args.count, GFP_KERNEL); ++ if (unlikely(!args.kbuf)) ++ goto out; ++ ++ read = 0; ++ do { ++ au_wkq_wait(call_read_k, &args, /*dlgt*/1); ++ if (unlikely(err > 0 ++ && copy_to_user(ubuf, args.kbuf, err))) { ++ err = -EFAULT; ++ goto out_free; ++ } else if (!err) ++ break; ++ else if (unlikely(err < 0)) ++ goto out_free; ++ count -= err; ++ /* do not read too much because of file i/o pointer */ ++ if (unlikely(count < args.count)) ++ args.count = count; ++ ubuf += err; ++ read += err; ++ } while (count); ++ smp_mb(); ++ err = read; ++ ++ out_free: ++ kfree(args.kbuf); ++ out: ++ return err; ++ } ++} ++ ++ssize_t vfsub_read_k(struct file *file, void *kbuf, size_t count, loff_t *ppos, ++ int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_read_k(file, kbuf, count, ppos); ++ else { ++ ssize_t err; ++ struct read_args args = { ++ .errp = &err, ++ .file = file, ++ .count = count, ++ .ppos = ppos ++ }; ++ args.kbuf = kbuf; ++ au_wkq_wait(call_read_k, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++struct write_args { ++ ssize_t *errp; ++ struct file *file; ++ union { ++ void *kbuf; ++ const char __user *ubuf; ++ }; ++ void *buf; ++ size_t count; ++ loff_t *ppos; ++}; ++ ++static void call_write_k(void *args) ++{ ++ struct write_args *a = args; ++ LKTRTrace("%.*s, cnt %lu, pos %Ld\n", ++ DLNPair(a->file->f_dentry), (unsigned long)a->count, ++ *a->ppos); ++ *a->errp = do_vfsub_write_k(a->file, a->kbuf, a->count, a->ppos); ++} ++ ++ssize_t vfsub_write_u(struct file *file, const char __user *ubuf, size_t count, ++ loff_t *ppos, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_write_u(file, ubuf, count, ppos); ++ else { ++ ssize_t err, written; ++ struct write_args args = { ++ .errp = &err, ++ .file = file, ++ .count = count, ++ .ppos = ppos ++ }; ++ ++ if (unlikely(!count)) ++ return 0; ++ ++ /* ++ * workaround an application bug. ++ * generally, read(2) or write(2) may return the value shorter ++ * than requested. But many applications don't support it, ++ * for example bash. ++ */ ++ err = -ENOMEM; ++ if (args.count > PAGE_SIZE) ++ args.count = PAGE_SIZE; ++ args.kbuf = kmalloc(args.count, GFP_KERNEL); ++ if (unlikely(!args.kbuf)) ++ goto out; ++ ++ written = 0; ++ do { ++ if (unlikely(copy_from_user(args.kbuf, ubuf, args.count))) { ++ err = -EFAULT; ++ goto out_free; ++ } ++ ++ au_wkq_wait(call_write_k, &args, /*dlgt*/1); ++ if (err > 0) { ++ count -= err; ++ if (count < args.count) ++ args.count = count; ++ ubuf += err; ++ written += err; ++ } else if (!err) ++ break; ++ else if (unlikely(err < 0)) ++ goto out_free; ++ } while (count); ++ err = written; ++ ++ out_free: ++ kfree(args.kbuf); ++ out: ++ return err; ++ } ++} ++ ++ssize_t vfsub_write_k(struct file *file, void *kbuf, size_t count, loff_t *ppos, ++ int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_write_k(file, kbuf, count, ppos); ++ else { ++ ssize_t err; ++ struct write_args args = { ++ .errp = &err, ++ .file = file, ++ .count = count, ++ .ppos = ppos ++ }; ++ args.kbuf = kbuf; ++ au_wkq_wait(call_write_k, &args, /*dlgt*/1); ++ return err; ++ } ++} ++ ++struct readdir_args { ++ int *errp; ++ struct file *file; ++ filldir_t filldir; ++ void *arg; ++}; ++ ++static void call_readdir(void *args) ++{ ++ struct readdir_args *a = args; ++ *a->errp = do_vfsub_readdir(a->file, a->filldir, a->arg); ++} ++ ++int vfsub_readdir(struct file *file, filldir_t filldir, void *arg, int dlgt) ++{ ++ if (!dlgt) ++ return do_vfsub_readdir(file, filldir, arg); ++ else { ++ int err; ++ struct readdir_args args = { ++ .errp = &err, ++ .file = file, ++ .filldir = filldir, ++ .arg = arg ++ }; ++ au_wkq_wait(call_readdir, &args, /*dlgt*/1); ++ return err; ++ } ++} ++#endif /* CONFIG_AUFS_DLGT */ ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct notify_change_args { ++ int *errp; ++ struct dentry *h_dentry; ++ struct iattr *ia; ++}; ++ ++static void call_notify_change(void *args) ++{ ++ struct notify_change_args *a = args; ++ struct inode *h_inode; ++ ++ LKTRTrace("%.*s, ia_valid 0x%x\n", ++ DLNPair(a->h_dentry), a->ia->ia_valid); ++ h_inode = a->h_dentry->d_inode; ++ IMustLock(h_inode); ++ ++ *a->errp = -EPERM; ++ if (!IS_IMMUTABLE(h_inode) && !IS_APPEND(h_inode)) { ++ lockdep_off(); ++ *a->errp = notify_change(a->h_dentry, a->ia); ++ lockdep_on(); ++ } ++ TraceErr(*a->errp); ++} ++ ++int vfsub_notify_change(struct dentry *dentry, struct iattr *ia, int dlgt) ++{ ++ int err; ++ struct notify_change_args args = { ++ .errp = &err, ++ .h_dentry = dentry, ++ .ia = ia ++ }; ++ ++#ifndef CONFIG_AUFS_DLGT ++ call_notify_change(&args); ++#else ++ if (!dlgt) ++ call_notify_change(&args); ++ else ++ au_wkq_wait(call_notify_change, &args, /*dlgt*/1); ++#endif ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct unlink_args { ++ int *errp; ++ struct inode *dir; ++ struct dentry *dentry; ++}; ++ ++static void call_unlink(void *args) ++{ ++ struct unlink_args *a = args; ++ struct inode *h_inode; ++ const int stop_sillyrename = (au_is_nfs(a->dentry->d_sb) ++ && atomic_read(&a->dentry->d_count) == 1); ++ ++ LKTRTrace("%.*s, stop_silly %d, cnt %d\n", ++ DLNPair(a->dentry), stop_sillyrename, ++ atomic_read(&a->dentry->d_count)); ++ IMustLock(a->dir); ++ ++ if (!stop_sillyrename) ++ dget(a->dentry); ++ h_inode = a->dentry->d_inode; ++ if (h_inode) ++ atomic_inc(&h_inode->i_count); ++#if 0 // partial testing ++ { ++ struct qstr *name = &a->dentry->d_name; ++ if (name->len == sizeof(AUFS_XINO_FNAME) - 1 ++ && !strncmp(name->name, AUFS_XINO_FNAME, name->len)) { ++ lockdep_off(); ++ *a->errp = vfs_unlink(a->dir, a->dentry); ++ lockdep_on(); ++ } else ++ err = -1; ++ } ++#else ++ // vfs_unlink() locks inode ++ lockdep_off(); ++ *a->errp = vfs_unlink(a->dir, a->dentry); ++ lockdep_on(); ++#endif ++ ++ if (!stop_sillyrename) ++ dput(a->dentry); ++ if (h_inode) ++ iput(h_inode); ++ ++ TraceErr(*a->errp); ++} ++ ++/* ++ * @dir: must be locked. ++ * @dentry: target dentry. ++ */ ++int vfsub_unlink(struct inode *dir, struct dentry *dentry, int dlgt) ++{ ++ int err; ++ struct unlink_args args = { ++ .errp = &err, ++ .dir = dir, ++ .dentry = dentry ++ }; ++ ++#ifndef CONFIG_AUFS_DLGT ++ call_unlink(&args); ++#else ++ if (!dlgt) ++ call_unlink(&args); ++ else ++ au_wkq_wait(call_unlink, &args, /*dlgt*/1); ++#endif ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct statfs_args { ++ int *errp; ++ void *arg; ++ struct kstatfs *buf; ++}; ++ ++static void call_statfs(void *args) ++{ ++ struct statfs_args *a = args; ++ *a->errp = vfs_statfs(a->arg, a->buf); ++} ++ ++int vfsub_statfs(void *arg, struct kstatfs *buf, int dlgt) ++{ ++ int err; ++ struct statfs_args args = { ++ .errp = &err, ++ .arg = arg, ++ .buf = buf ++ }; ++ ++#ifndef CONFIG_AUFS_DLGT ++ call_statfs(&args); ++#else ++ if (!dlgt) ++ call_statfs(&args); ++ else ++ au_wkq_wait(call_statfs, &args, /*dlgt*/1); ++#endif ++ return err; ++} +diff --git a/fs/aufs/vfsub.h b/fs/aufs/vfsub.h +new file mode 100755 +index 0000000..52f15cc +--- /dev/null ++++ b/fs/aufs/vfsub.h +@@ -0,0 +1,427 @@ ++/* ++ * Copyright (C) 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: vfsub.h,v 1.8 2007/05/14 03:39:10 sfjro Exp $ */ ++ ++#ifndef __AUFS_VFSUB_H__ ++#define __AUFS_VFSUB_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <asm/uaccess.h> ++#include "wkq.h" ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* simple abstractions, for future use */ ++static inline ++int do_vfsub_permission(struct inode *inode, int mask, struct nameidata *nd) ++{ ++ LKTRTrace("i%lu, mask 0x%x, nd %p\n", inode->i_ino, mask, nd); ++#if 0 ++#else ++ return permission(inode, mask, nd); ++#endif ++} ++ ++static inline ++struct file *vfsub_filp_open(const char *path, int oflags, int mode) ++{ ++ struct file *err; ++ ++ LKTRTrace("%s\n", path); ++ ++ lockdep_off(); ++ err = filp_open(path, oflags, mode); ++ lockdep_on(); ++ return err; ++} ++ ++static inline ++int vfsub_path_lookup(const char *name, unsigned int flags, ++ struct nameidata *nd) ++{ ++ int err; ++ ++ LKTRTrace("%s\n", name); ++ ++ //lockdep_off(); ++ err = path_lookup(name, flags, nd); ++ //lockdep_on(); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline ++int do_vfsub_create(struct inode *dir, struct dentry *dentry, int mode, ++ struct nameidata *nd) ++{ ++ LKTRTrace("i%lu, %.*s, 0x%x\n", dir->i_ino, DLNPair(dentry), mode); ++#if 0 ++#else ++ return vfs_create(dir, dentry, mode, nd); ++#endif ++} ++ ++static inline ++int do_vfsub_symlink(struct inode *dir, struct dentry *dentry, ++ const char *symname, int mode) ++{ ++ LKTRTrace("i%lu, %.*s, %s, 0x%x\n", ++ dir->i_ino, DLNPair(dentry), symname, mode); ++#if 0 ++#else ++ return vfs_symlink(dir, dentry, symname, mode); ++#endif ++} ++ ++static inline ++int do_vfsub_mknod(struct inode *dir, struct dentry *dentry, int mode, ++ dev_t dev) ++{ ++ LKTRTrace("i%lu, %.*s, 0x%x\n", dir->i_ino, DLNPair(dentry), mode); ++#if 0 ++#else ++ return vfs_mknod(dir, dentry, mode, dev); ++#endif ++} ++ ++static inline ++int do_vfsub_link(struct dentry *src_dentry, struct inode *dir, ++ struct dentry *dentry) ++{ ++ int err; ++ ++ LKTRTrace("%.*s, i%lu, %.*s\n", ++ DLNPair(src_dentry), dir->i_ino, DLNPair(dentry)); ++ ++ lockdep_off(); ++#if 0 ++#else ++ err = vfs_link(src_dentry, dir, dentry); ++#endif ++ lockdep_on(); ++ return err; ++} ++ ++static inline ++int do_vfsub_rename(struct inode *src_dir, struct dentry *src_dentry, ++ struct inode *dir, struct dentry *dentry) ++{ ++ int err; ++ ++ LKTRTrace("i%lu, %.*s, i%lu, %.*s\n", ++ src_dir->i_ino, DLNPair(src_dentry), ++ dir->i_ino, DLNPair(dentry)); ++ ++ lockdep_off(); ++#if 0 ++#else ++ err = vfs_rename(src_dir, src_dentry, dir, dentry); ++#endif ++ lockdep_on(); ++ return err; ++} ++ ++static inline ++int do_vfsub_mkdir(struct inode *dir, struct dentry *dentry, int mode) ++{ ++ LKTRTrace("i%lu, %.*s, 0x%x\n", dir->i_ino, DLNPair(dentry), mode); ++#if 0 ++#else ++ return vfs_mkdir(dir, dentry, mode); ++#endif ++} ++ ++static inline int do_vfsub_rmdir(struct inode *dir, struct dentry *dentry) ++{ ++ int err; ++ ++ LKTRTrace("i%lu, %.*s\n", dir->i_ino, DLNPair(dentry)); ++ ++ lockdep_off(); ++#if 0 ++#else ++ err = vfs_rmdir(dir, dentry); ++#endif ++ lockdep_on(); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline ++ssize_t do_vfsub_read_u(struct file *file, char __user *ubuf, size_t count, ++ loff_t *ppos) ++{ ++ ssize_t err; ++ ++ LKTRTrace("%.*s, cnt %lu, pos %Ld\n", ++ DLNPair(file->f_dentry), (unsigned long)count, *ppos); ++ ++ /* nfs uses some locks */ ++ lockdep_off(); ++#if 0 ++#else ++ err = vfs_read(file, ubuf, count, ppos); ++#endif ++ lockdep_on(); ++ return err; ++} ++ ++// kernel_read() ?? ++static inline ++ssize_t do_vfsub_read_k(struct file *file, void *kbuf, size_t count, ++ loff_t *ppos) ++{ ++ ssize_t err; ++ mm_segment_t oldfs; ++ ++ oldfs = get_fs(); ++ set_fs(KERNEL_DS); ++ err = do_vfsub_read_u(file, (char __user*)kbuf, count, ppos); ++ set_fs(oldfs); ++ return err; ++} ++ ++static inline ++ssize_t do_vfsub_write_u(struct file *file, const char __user *ubuf, ++ size_t count, loff_t *ppos) ++{ ++ ssize_t err; ++ ++ LKTRTrace("%.*s, cnt %lu, pos %Ld\n", ++ DLNPair(file->f_dentry), (unsigned long)count, *ppos); ++ ++ lockdep_off(); ++#if 0 ++#else ++ err = vfs_write(file, ubuf, count, ppos); ++#endif ++ lockdep_on(); ++ return err; ++} ++ ++static inline ++ssize_t do_vfsub_write_k(struct file *file, void *kbuf, size_t count, ++ loff_t *ppos) ++{ ++ ssize_t err; ++ mm_segment_t oldfs; ++ ++ oldfs = get_fs(); ++ set_fs(KERNEL_DS); ++ err = do_vfsub_write_u(file, (const char __user*)kbuf, count, ppos); ++ set_fs(oldfs); ++ return err; ++} ++ ++static inline ++int do_vfsub_readdir(struct file *file, filldir_t filldir, void *arg) ++{ ++ int err; ++ ++ LKTRTrace("%.*s\n", DLNPair(file->f_dentry)); ++ ++ lockdep_off(); ++#if 0 ++#else ++ err = vfs_readdir(file, filldir, arg); ++#endif ++ lockdep_on(); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline loff_t vfsub_llseek(struct file *file, loff_t offset, int origin) ++{ ++ loff_t err; ++ ++ LKTRTrace("%.*s\n", DLNPair(file->f_dentry)); ++ ++ lockdep_off(); ++#if 0 ++#else ++ err = vfs_llseek(file, offset, origin); ++#endif ++ lockdep_on(); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_DLGT ++static inline int need_dlgt(struct super_block *sb) ++{ ++ return (au_flag_test(sb, AuFlag_DLGT) && !is_au_wkq(current)); ++} ++ ++int vfsub_permission(struct inode *inode, int mask, struct nameidata *nd, ++ int dlgt); ++ ++int vfsub_create(struct inode *dir, struct dentry *dentry, int mode, ++ struct nameidata *nd, int dlgt); ++int vfsub_symlink(struct inode *dir, struct dentry *dentry, const char *symname, ++ int mode, int dlgt); ++int vfsub_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev, ++ int dlgt); ++int vfsub_link(struct dentry *src_dentry, struct inode *dir, ++ struct dentry *dentry, int dlgt); ++int vfsub_rename(struct inode *src_dir, struct dentry *src_dentry, ++ struct inode *dir, struct dentry *dentry, int dlgt); ++int vfsub_mkdir(struct inode *dir, struct dentry *dentry, int mode, int dlgt); ++int vfsub_rmdir(struct inode *dir, struct dentry *dentry, int dlgt); ++ ++ssize_t vfsub_read_u(struct file *file, char __user *ubuf, size_t count, ++ loff_t *ppos, int dlgt); ++ssize_t vfsub_read_k(struct file *file, void *kbuf, size_t count, loff_t *ppos, ++ int dlgt); ++ssize_t vfsub_write_u(struct file *file, const char __user *ubuf, size_t count, ++ loff_t *ppos, int dlgt); ++ssize_t vfsub_write_k(struct file *file, void *kbuf, size_t count, loff_t *ppos, ++ int dlgt); ++int vfsub_readdir(struct file *file, filldir_t filldir, void *arg, int dlgt); ++ ++#else ++ ++static inline int need_dlgt(struct super_block *sb) ++{ ++ return 0; ++} ++ ++static inline ++int vfsub_permission(struct inode *inode, int mask, struct nameidata *nd, ++ int dlgt) ++{ ++ return do_vfsub_permission(inode, mask, nd); ++} ++ ++static inline ++int vfsub_create(struct inode *dir, struct dentry *dentry, int mode, ++ struct nameidata *nd, int dlgt) ++{ ++ return do_vfsub_create(dir, dentry, mode, nd); ++} ++ ++static inline ++int vfsub_symlink(struct inode *dir, struct dentry *dentry, const char *symname, ++ int mode, int dlgt) ++{ ++ return do_vfsub_symlink(dir, dentry, symname, mode); ++} ++ ++static inline ++int vfsub_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev, ++ int dlgt) ++{ ++ return do_vfsub_mknod(dir, dentry, mode, dev); ++} ++ ++static inline ++int vfsub_link(struct dentry *src_dentry, struct inode *dir, ++ struct dentry *dentry, int dlgt) ++{ ++ return do_vfsub_link(src_dentry, dir, dentry); ++} ++ ++static inline ++int vfsub_rename(struct inode *src_dir, struct dentry *src_dentry, ++ struct inode *dir, struct dentry *dentry, int dlgt) ++{ ++ return do_vfsub_rename(src_dir, src_dentry, dir, dentry); ++} ++ ++static inline ++int vfsub_mkdir(struct inode *dir, struct dentry *dentry, int mode, ++ int dlgt) ++{ ++ return do_vfsub_mkdir(dir, dentry, mode); ++} ++ ++static inline ++int vfsub_rmdir(struct inode *dir, struct dentry *dentry, int dlgt) ++{ ++ return do_vfsub_rmdir(dir, dentry); ++} ++ ++static inline ++ssize_t vfsub_read_u(struct file *file, char __user *ubuf, size_t count, ++ loff_t *ppos, int dlgt) ++{ ++ return do_vfsub_read_u(file, ubuf, count, ppos); ++} ++ ++static inline ++ssize_t vfsub_read_k(struct file *file, void *kbuf, size_t count, loff_t *ppos, ++ int dlgt) ++{ ++ return do_vfsub_read_k(file, kbuf, count, ppos); ++} ++ ++static inline ++ssize_t vfsub_write_u(struct file *file, const char __user *ubuf, size_t count, ++ loff_t *ppos, int dlgt) ++{ ++ return do_vfsub_write_u(file, ubuf, count, ppos); ++} ++ ++static inline ++ssize_t vfsub_write_k(struct file *file, void *kbuf, size_t count, loff_t *ppos, ++ int dlgt) ++{ ++ return do_vfsub_write_k(file, kbuf, count, ppos); ++} ++ ++static inline ++int vfsub_readdir(struct file *file, filldir_t filldir, void *arg, int dlgt) ++{ ++ return do_vfsub_readdir(file, filldir, arg); ++} ++#endif /* CONFIG_AUFS_DLGT */ ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline ++struct dentry *vfsub_lock_rename(struct dentry *d1, struct dentry *d2) ++{ ++ struct dentry *d; ++ ++ lockdep_off(); ++ d = lock_rename(d1, d2); ++ lockdep_on(); ++ return d; ++} ++ ++static inline void vfsub_unlock_rename(struct dentry *d1, struct dentry *d2) ++{ ++ lockdep_off(); ++ unlock_rename(d1, d2); ++ lockdep_on(); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++int vfsub_notify_change(struct dentry *dentry, struct iattr *ia, int dlgt); ++int vfsub_unlink(struct inode *dir, struct dentry *dentry, int dlgt); ++int vfsub_statfs(void *arg, struct kstatfs *buf, int dlgt); ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_VFSUB_H__ */ +diff --git a/fs/aufs/whout.c b/fs/aufs/whout.c +new file mode 100755 +index 0000000..b7f874c +--- /dev/null ++++ b/fs/aufs/whout.c +@@ -0,0 +1,933 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: whout.c,v 1.14 2007/05/14 03:40:40 sfjro Exp $ */ ++ ++#include <linux/fs.h> ++#include <linux/namei.h> ++#include <linux/random.h> ++#include <linux/security.h> ++#include "aufs.h" ++ ++#define WH_MASK S_IRUGO ++ ++/* If a directory contains this file, then it is opaque. We start with the ++ * .wh. flag so that it is blocked by lookup. ++ */ ++static struct qstr diropq_name = { ++ .name = AUFS_WH_DIROPQ, ++ .len = sizeof(AUFS_WH_DIROPQ) - 1 ++}; ++ ++/* ++ * generate whiteout name, which is NOT terminated by NULL. ++ * @name: original d_name.name ++ * @len: original d_name.len ++ * @wh: whiteout qstr ++ * returns zero when succeeds, otherwise error. ++ * succeeded value as wh->name should be freed by au_free_whname(). ++ */ ++int au_alloc_whname(const char *name, int len, struct qstr *wh) ++{ ++ char *p; ++ ++ DEBUG_ON(!name || !len || !wh); ++ ++ if (unlikely(len > PATH_MAX - AUFS_WH_PFX_LEN)) ++ return -ENAMETOOLONG; ++ ++ wh->len = len + AUFS_WH_PFX_LEN; ++ wh->name = p = kmalloc(wh->len, GFP_KERNEL); ++ //if (LktrCond) {kfree(p); wh->name = p = NULL;} ++ if (p) { ++ memcpy(p, AUFS_WH_PFX, AUFS_WH_PFX_LEN); ++ memcpy(p + AUFS_WH_PFX_LEN, name, len); ++ //smp_mb(); ++ return 0; ++ } ++ return -ENOMEM; ++} ++ ++void au_free_whname(struct qstr *wh) ++{ ++ DEBUG_ON(!wh || !wh->name); ++ kfree(wh->name); ++#ifdef CONFIG_AUFS_DEBUG ++ wh->name = NULL; ++#endif ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * test if the @wh_name exists under @hidden_parent. ++ * @try_sio specifies the necessary of super-io. ++ */ ++int is_wh(struct dentry *hidden_parent, struct qstr *wh_name, int try_sio, ++ struct lkup_args *lkup) ++{ ++ int err; ++ struct dentry *wh_dentry; ++ struct inode *hidden_dir; ++ ++ LKTRTrace("%.*s/%.*s, lkup{%p, %d}\n", DLNPair(hidden_parent), ++ wh_name->len, wh_name->name, lkup->nfsmnt, lkup->dlgt); ++ hidden_dir = hidden_parent->d_inode; ++ DEBUG_ON(!S_ISDIR(hidden_dir->i_mode)); ++ IMustLock(hidden_dir); ++ ++ if (!try_sio) ++ wh_dentry = lkup_one(wh_name->name, hidden_parent, ++ wh_name->len, lkup); ++ else ++ wh_dentry = sio_lkup_one(wh_name->name, hidden_parent, ++ wh_name->len, lkup); ++ //if (LktrCond) {dput(wh_dentry); wh_dentry = ERR_PTR(-1);} ++ err = PTR_ERR(wh_dentry); ++ if (IS_ERR(wh_dentry)) ++ goto out; ++ ++ err = 0; ++ if (!wh_dentry->d_inode) ++ goto out_wh; /* success */ ++ ++ err = 1; ++ if (S_ISREG(wh_dentry->d_inode->i_mode)) ++ goto out_wh; /* success */ ++ ++ err = -EIO; ++ IOErr("%.*s Invalid whiteout entry type 0%o.\n", ++ DLNPair(wh_dentry), wh_dentry->d_inode->i_mode); ++ ++ out_wh: ++ dput(wh_dentry); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * test if the @hidden_dentry sets opaque or not. ++ */ ++int is_diropq(struct dentry *hidden_dentry, struct lkup_args *lkup) ++{ ++ int err; ++ struct inode *hidden_dir; ++ ++ LKTRTrace("dentry %.*s\n", DLNPair(hidden_dentry)); ++ hidden_dir = hidden_dentry->d_inode; ++ DEBUG_ON(!S_ISDIR(hidden_dir->i_mode)); ++ IMustLock(hidden_dir); ++ ++ err = is_wh(hidden_dentry, &diropq_name, /*try_sio*/1, lkup); ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * returns a negative dentry whose name is unique and temporary. ++ */ ++struct dentry *lkup_whtmp(struct dentry *hidden_parent, struct qstr *prefix, ++ struct lkup_args *lkup) ++{ ++#define HEX_LEN 4 ++ struct dentry *dentry; ++ int len, i; ++ char defname[AUFS_WH_PFX_LEN * 2 + DNAME_INLINE_LEN_MIN + 1 ++ + HEX_LEN + 1], *name, *p; ++ static unsigned char cnt; ++ ++ LKTRTrace("hp %.*s, prefix %.*s\n", ++ DLNPair(hidden_parent), prefix->len, prefix->name); ++ DEBUG_ON(!hidden_parent->d_inode); ++ IMustLock(hidden_parent->d_inode); ++ ++ name = defname; ++ len = sizeof(defname) - DNAME_INLINE_LEN_MIN + prefix->len - 1; ++ if (unlikely(prefix->len > DNAME_INLINE_LEN_MIN)) { ++ dentry = ERR_PTR(-ENAMETOOLONG); ++ if (unlikely(len >= PATH_MAX)) ++ goto out; ++ dentry = ERR_PTR(-ENOMEM); ++ name = kmalloc(len + 1, GFP_KERNEL); ++ //if (LktrCond) {kfree(name); name = NULL;} ++ if (unlikely(!name)) ++ goto out; ++ } ++ ++ // doubly whiteout-ed ++ memcpy(name, AUFS_WH_PFX AUFS_WH_PFX, AUFS_WH_PFX_LEN * 2); ++ p = name + AUFS_WH_PFX_LEN * 2; ++ memcpy(p, prefix->name, prefix->len); ++ p += prefix->len; ++ *p++ = '.'; ++ DEBUG_ON(name + len + 1 - p <= HEX_LEN); ++ ++ for (i = 0; i < 3; i++) { ++ sprintf(p, "%.*d", HEX_LEN, cnt++); ++ dentry = sio_lkup_one(name, hidden_parent, len, lkup); ++ //if (LktrCond) {dput(dentry); dentry = ERR_PTR(-1);} ++ if (unlikely(IS_ERR(dentry) || !dentry->d_inode)) ++ goto out_name; ++ dput(dentry); ++ } ++ //Warn("could not get random name\n"); ++ dentry = ERR_PTR(-EEXIST); ++ Dbg("%.*s\n", len, name); ++ BUG(); ++ ++ out_name: ++ if (unlikely(name != defname)) ++ kfree(name); ++ out: ++ TraceErrPtr(dentry); ++ return dentry; ++#undef HEX_LEN ++} ++ ++/* ++ * rename the @dentry of @bindex to the whiteouted temporary name. ++ */ ++int rename_whtmp(struct dentry *dentry, aufs_bindex_t bindex) ++{ ++ int err; ++ struct inode *hidden_dir; ++ struct dentry *hidden_dentry, *hidden_parent, *tmp_dentry; ++ struct super_block *sb; ++ struct lkup_args lkup; ++ ++ LKTRTrace("%.*s, b%d\n", DLNPair(dentry), bindex); ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ DEBUG_ON(!hidden_dentry || !hidden_dentry->d_inode); ++ hidden_parent = hidden_dentry->d_parent; ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ ++ sb = dentry->d_sb; ++ lkup.nfsmnt = au_nfsmnt(sb, bindex); ++ lkup.dlgt = need_dlgt(sb); ++ tmp_dentry = lkup_whtmp(hidden_parent, &hidden_dentry->d_name, &lkup); ++ //if (LktrCond) {dput(tmp_dentry); tmp_dentry = ERR_PTR(-1);} ++ err = PTR_ERR(tmp_dentry); ++ if (!IS_ERR(tmp_dentry)) { ++ /* under the same dir, no need to lock_rename() */ ++ err = vfsub_rename(hidden_dir, hidden_dentry, ++ hidden_dir, tmp_dentry, lkup.dlgt); ++ //if (LktrCond) err = -1; //unavailable ++ TraceErr(err); ++ dput(tmp_dentry); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++int au_unlink_wh_dentry(struct inode *hidden_dir, struct dentry *wh_dentry, ++ struct dentry *dentry, int dlgt) ++{ ++ int err; ++ ++ LKTRTrace("hi%lu, wh %.*s, d %p\n", hidden_dir->i_ino, ++ DLNPair(wh_dentry), dentry); ++ DEBUG_ON((dentry && dbwh(dentry) == -1) ++ || !wh_dentry->d_inode ++ || !S_ISREG(wh_dentry->d_inode->i_mode)); ++ IMustLock(hidden_dir); ++ ++ err = vfsub_unlink(hidden_dir, wh_dentry, dlgt); ++ //if (LktrCond) err = -1; // unavailable ++ if (!err && dentry) ++ set_dbwh(dentry, -1); ++ ++ TraceErr(err); ++ return err; ++} ++ ++static int unlink_wh_name(struct dentry *hidden_parent, struct qstr *wh, ++ struct lkup_args *lkup) ++{ ++ int err; ++ struct inode *hidden_dir; ++ struct dentry *hidden_dentry; ++ ++ LKTRTrace("%.*s/%.*s\n", DLNPair(hidden_parent), LNPair(wh)); ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ ++ // au_test_perm() is already done ++ hidden_dentry = lkup_one(wh->name, hidden_parent, wh->len, lkup); ++ //if (LktrCond) {dput(hidden_dentry); hidden_dentry = ERR_PTR(-1);} ++ if (!IS_ERR(hidden_dentry)) { ++ err = 0; ++ if (hidden_dentry->d_inode) ++ err = vfsub_unlink(hidden_dir, hidden_dentry, ++ lkup->dlgt); ++ dput(hidden_dentry); ++ } else ++ err = PTR_ERR(hidden_dentry); ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static void clean_wh(struct inode *h_dir, struct dentry *wh) ++{ ++ TraceEnter(); ++ if (wh->d_inode) { ++ int err = vfsub_unlink(h_dir, wh, /*dlgt*/0); ++ if (unlikely(err)) ++ Warn("failed unlink %.*s (%d), ignored.\n", ++ DLNPair(wh), err); ++ } ++} ++ ++static void clean_plink(struct inode *h_dir, struct dentry *plink) ++{ ++ TraceEnter(); ++ if (plink->d_inode) { ++ int err = vfsub_rmdir(h_dir, plink, /*dlgt*/0); ++ if (unlikely(err)) ++ Warn("failed rmdir %.*s (%d), ignored.\n", ++ DLNPair(plink), err); ++ } ++} ++ ++static int test_linkable(struct inode *h_dir) ++{ ++ if (h_dir->i_op && h_dir->i_op->link) ++ return 0; ++ return -ENOSYS; ++} ++ ++static int plink_dir(struct inode *h_dir, struct dentry *plink) ++{ ++ int err; ++ ++ err = -EEXIST; ++ if (!plink->d_inode) { ++ int mode = S_IRWXU; ++ if (unlikely(au_is_nfs(plink->d_sb))) ++ mode |= S_IXUGO; ++ err = vfsub_mkdir(h_dir, plink, mode, /*dlgt*/0); ++ } else if (S_ISDIR(plink->d_inode->i_mode)) ++ err = 0; ++ else ++ Err("unknown %.*s exists\n", DLNPair(plink)); ++ ++ return err; ++} ++ ++/* ++ * initialize the whiteout base file/dir for @br. ++ */ ++int init_wh(struct dentry *h_root, struct aufs_branch *br, ++ struct vfsmount *nfsmnt, struct super_block *sb) ++{ ++ int err; ++ struct dentry *wh, *plink; ++ struct inode *h_dir; ++ static struct qstr base_name[] = { ++ {.name = AUFS_WH_BASENAME, .len = sizeof(AUFS_WH_BASENAME) - 1}, ++ {.name = AUFS_WH_PLINKDIR, .len = sizeof(AUFS_WH_PLINKDIR) - 1} ++ }; ++ struct lkup_args lkup = { ++ .nfsmnt = nfsmnt, ++ .dlgt = 0 // always no dlgt ++ }; ++ const int do_plink = au_flag_test(sb, AuFlag_PLINK); ++ ++ LKTRTrace("nfsmnt %p\n", nfsmnt); ++ BrWhMustWriteLock(br); ++ SiMustWriteLock(sb); ++ h_dir = h_root->d_inode; ++ IMustLock(h_dir); ++ ++ // doubly whiteouted ++ wh = lkup_wh(h_root, base_name + 0, &lkup); ++ //if (LktrCond) {dput(wh); wh = ERR_PTR(-1);} ++ err = PTR_ERR(wh); ++ if (IS_ERR(wh)) ++ goto out; ++ DEBUG_ON(br->br_wh && br->br_wh != wh); ++ ++ plink = lkup_wh(h_root, base_name + 1, &lkup); ++ err = PTR_ERR(plink); ++ if (IS_ERR(plink)) ++ goto out_dput_wh; ++ DEBUG_ON(br->br_plink && br->br_plink != plink); ++ ++ dput(br->br_wh); ++ dput(br->br_plink); ++ br->br_wh = br->br_plink = NULL; ++ ++ err = 0; ++ switch (br->br_perm) { ++ case AuBr_RR: ++ case AuBr_RO: ++ case AuBr_RRWH: ++ case AuBr_ROWH: ++ clean_wh(h_dir, wh); ++ clean_plink(h_dir, plink); ++ break; ++ ++ case AuBr_RWNoLinkWH: ++ clean_wh(h_dir, wh); ++ if (do_plink) { ++ err = test_linkable(h_dir); ++ if (unlikely(err)) ++ goto out_nolink; ++ ++ err = plink_dir(h_dir, plink); ++ if (unlikely(err)) ++ goto out_err; ++ br->br_plink = dget(plink); ++ } else ++ clean_plink(h_dir, plink); ++ break; ++ ++ case AuBr_RW: ++ /* ++ * for the moment, aufs supports the branch filesystem ++ * which does not support link(2). ++ * testing on FAT which does not support i_op->setattr() fully either, ++ * copyup failed. ++ * finally, such filesystem will not be used as the writable branch. ++ */ ++ err = test_linkable(h_dir); ++ if (unlikely(err)) ++ goto out_nolink; ++ ++ err = -EEXIST; ++ if (!wh->d_inode) ++ err = vfsub_create(h_dir, wh, WH_MASK, NULL, /*dlgt*/0); ++ else if (S_ISREG(wh->d_inode->i_mode)) ++ err = 0; ++ else ++ Err("unknown %.*s/%.*s exists\n", ++ DLNPair(h_root), DLNPair(wh)); ++ if (unlikely(err)) ++ goto out_err; ++ ++ if (do_plink) { ++ err = plink_dir(h_dir, plink); ++ if (unlikely(err)) ++ goto out_err; ++ br->br_plink = dget(plink); ++ } else ++ clean_plink(h_dir, plink); ++ br->br_wh = dget(wh); ++ break; ++ ++ default: ++ BUG(); ++ } ++ ++ out_dput: ++ dput(plink); ++ out_dput_wh: ++ dput(wh); ++ out: ++ TraceErr(err); ++ return err; ++ out_nolink: ++ Err("%.*s doesn't support link(2), use noplink and rw+nolwh\n", ++ DLNPair(h_root)); ++ goto out_dput; ++ out_err: ++ Err("an error(%d) on the writable branch %.*s(%s)\n", ++ err, DLNPair(h_root), au_sbtype(h_root->d_sb)); ++ goto out_dput; ++} ++ ++struct reinit_br_wh { ++ struct super_block *sb; ++ struct aufs_branch *br; ++}; ++ ++static void reinit_br_wh(void *arg) ++{ ++ int err; ++ struct reinit_br_wh *a = arg; ++ struct inode *hidden_dir, *dir; ++ struct dentry *hidden_root; ++ aufs_bindex_t bindex; ++ ++ TraceEnter(); ++ DEBUG_ON(!a->br->br_wh || !a->br->br_wh->d_inode || current->fsuid); ++ ++ err = 0; ++ /* big lock */ ++ si_write_lock(a->sb); ++ if (unlikely(!br_writable(a->br->br_perm))) ++ goto out; ++ bindex = find_brindex(a->sb, a->br->br_id); ++ if (unlikely(bindex < 0)) ++ goto out; ++ ++ dir = a->sb->s_root->d_inode; ++ hidden_root = a->br->br_wh->d_parent; ++ hidden_dir = hidden_root->d_inode; ++ DEBUG_ON(!hidden_dir->i_op || !hidden_dir->i_op->link); ++ hdir_lock(hidden_dir, dir, bindex); ++ br_wh_write_lock(a->br); ++ err = vfsub_unlink(hidden_dir, a->br->br_wh, /*dlgt*/0); ++ //if (LktrCond) err = -1; ++ dput(a->br->br_wh); ++ a->br->br_wh = NULL; ++ if (!err) ++ err = init_wh(hidden_root, a->br, au_do_nfsmnt(a->br->br_mnt), ++ a->sb); ++ br_wh_write_unlock(a->br); ++ hdir_unlock(hidden_dir, dir, bindex); ++ ++ out: ++ atomic_dec(&a->br->br_wh_running); ++ br_put(a->br); ++ si_write_unlock(a->sb); ++ au_mntput(a->sb); ++ kfree(arg); ++ if (unlikely(err)) ++ IOErr("err %d\n", err); ++} ++ ++static void kick_reinit_br_wh(struct super_block *sb, struct aufs_branch *br) ++{ ++ int do_dec; ++ struct reinit_br_wh *arg; ++ ++ do_dec = 1; ++ if (atomic_inc_return(&br->br_wh_running) != 1) ++ goto out; ++ ++ // ignore ENOMEM ++ arg = kmalloc(sizeof(*arg), GFP_KERNEL); ++ if (arg) { ++ // dec(wh_running), kfree(arg) and br_put() in reinit function ++ arg->sb = sb; ++ arg->br = br; ++ br_get(br); ++ /* prohibit umount */ ++ au_mntget(sb); ++ au_wkq_nowait(reinit_br_wh, arg, /*dlgt*/0); ++ do_dec = 0; ++ } ++ ++ out: ++ if (do_dec) ++ atomic_dec(&br->br_wh_running); ++} ++ ++/* ++ * create the whiteoute @wh. ++ */ ++static int link_or_create_wh(struct dentry *wh, struct super_block *sb, ++ aufs_bindex_t bindex) ++{ ++ int err, dlgt; ++ struct aufs_branch *br; ++ struct dentry *hidden_parent; ++ struct inode *hidden_dir; ++ ++ LKTRTrace("%.*s\n", DLNPair(wh)); ++ SiMustReadLock(sb); ++ hidden_parent = wh->d_parent; ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ ++ dlgt = need_dlgt(sb); ++ br = stobr(sb, bindex); ++ br_wh_read_lock(br); ++ if (br->br_wh) { ++ err = vfsub_link(br->br_wh, hidden_dir, wh, dlgt); ++ if (!err || err != -EMLINK) ++ goto out; ++ ++ // link count full. re-initialize br_wh. ++ kick_reinit_br_wh(sb, br); ++ } ++ ++ // return this error in this context ++ err = vfsub_create(hidden_dir, wh, WH_MASK, NULL, dlgt); ++ ++ out: ++ br_wh_read_unlock(br); ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * create or remove the diropq. ++ */ ++static struct dentry *do_diropq(struct dentry *dentry, aufs_bindex_t bindex, ++ int do_create, int dlgt) ++{ ++ struct dentry *opq_dentry, *hidden_dentry; ++ struct inode *hidden_dir; ++ int err; ++ struct super_block *sb; ++ struct lkup_args lkup; ++ ++ LKTRTrace("%.*s, bindex %d, do_create %d\n", DLNPair(dentry), ++ bindex, do_create); ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ DEBUG_ON(!hidden_dentry); ++ hidden_dir = hidden_dentry->d_inode; ++ DEBUG_ON(!hidden_dir || !S_ISDIR(hidden_dir->i_mode)); ++ IMustLock(hidden_dir); ++ ++ // already checked by au_test_perm(). ++ sb = dentry->d_sb; ++ lkup.nfsmnt = au_nfsmnt(sb, bindex); ++ lkup.dlgt = dlgt; ++ opq_dentry = lkup_one(diropq_name.name, hidden_dentry, diropq_name.len, ++ &lkup); ++ //if (LktrCond) {dput(opq_dentry); opq_dentry = ERR_PTR(-1);} ++ if (IS_ERR(opq_dentry)) ++ goto out; ++ ++ if (do_create) { ++ DEBUG_ON(opq_dentry->d_inode); ++ err = link_or_create_wh(opq_dentry, sb, bindex); ++ //if (LktrCond) {vfs_unlink(hidden_dir, opq_dentry); err = -1;} ++ if (!err) { ++ set_dbdiropq(dentry, bindex); ++ goto out; /* success */ ++ } ++ } else { ++ DEBUG_ON(/* !S_ISDIR(dentry->d_inode->i_mode) ++ * || */!opq_dentry->d_inode); ++ err = vfsub_unlink(hidden_dir, opq_dentry, lkup.dlgt); ++ //if (LktrCond) err = -1; ++ if (!err) ++ set_dbdiropq(dentry, -1); ++ } ++ dput(opq_dentry); ++ opq_dentry = ERR_PTR(err); ++ ++ out: ++ TraceErrPtr(opq_dentry); ++ return opq_dentry; ++} ++ ++struct do_diropq_args { ++ struct dentry **errp; ++ struct dentry *dentry; ++ aufs_bindex_t bindex; ++ int do_create, dlgt; ++}; ++ ++static void call_do_diropq(void *args) ++{ ++ struct do_diropq_args *a = args; ++ *a->errp = do_diropq(a->dentry, a->bindex, a->do_create, a->dlgt); ++} ++ ++struct dentry *sio_diropq(struct dentry *dentry, aufs_bindex_t bindex, ++ int do_create, int dlgt) ++{ ++ struct dentry *diropq, *hidden_dentry; ++ ++ LKTRTrace("%.*s, bindex %d, do_create %d\n", ++ DLNPair(dentry), bindex, do_create); ++ ++ hidden_dentry = au_h_dptr_i(dentry, bindex); ++ if (!au_test_perm(hidden_dentry->d_inode, MAY_EXEC | MAY_WRITE, dlgt)) ++ diropq = do_diropq(dentry, bindex, do_create, dlgt); ++ else { ++ struct do_diropq_args args = { ++ .errp = &diropq, ++ .dentry = dentry, ++ .bindex = bindex, ++ .do_create = do_create, ++ .dlgt = dlgt ++ }; ++ au_wkq_wait(call_do_diropq, &args, /*dlgt*/0); ++ } ++ ++ TraceErrPtr(diropq); ++ return diropq; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * lookup whiteout dentry. ++ * @hidden_parent: hidden parent dentry which must exist and be locked ++ * @base_name: name of dentry which will be whiteouted ++ * returns dentry for whiteout. ++ */ ++struct dentry *lkup_wh(struct dentry *hidden_parent, struct qstr *base_name, ++ struct lkup_args *lkup) ++{ ++ int err; ++ struct qstr wh_name; ++ struct dentry *wh_dentry; ++ ++ LKTRTrace("%.*s/%.*s\n", DLNPair(hidden_parent), LNPair(base_name)); ++ IMustLock(hidden_parent->d_inode); ++ ++ err = au_alloc_whname(base_name->name, base_name->len, &wh_name); ++ //if (LktrCond) {au_free_whname(&wh_name); err = -1;} ++ wh_dentry = ERR_PTR(err); ++ if (!err) { ++ // do not superio. ++ wh_dentry = lkup_one(wh_name.name, hidden_parent, wh_name.len, ++ lkup); ++ au_free_whname(&wh_name); ++ } ++ TraceErrPtr(wh_dentry); ++ return wh_dentry; ++} ++ ++/* ++ * link/create a whiteout for @dentry on @bindex. ++ */ ++struct dentry *simple_create_wh(struct dentry *dentry, aufs_bindex_t bindex, ++ struct dentry *hidden_parent, ++ struct lkup_args *lkup) ++{ ++ struct dentry *wh_dentry; ++ int err; ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s/%.*s on b%d\n", DLNPair(hidden_parent), ++ DLNPair(dentry), bindex); ++ ++ sb = dentry->d_sb; ++ wh_dentry = lkup_wh(hidden_parent, &dentry->d_name, lkup); ++ //au_nfsmnt(sb, bindex), need_dlgt(sb)); ++ //if (LktrCond) {dput(wh_dentry); wh_dentry = ERR_PTR(-1);} ++ if (!IS_ERR(wh_dentry) && !wh_dentry->d_inode) { ++ IMustLock(hidden_parent->d_inode); ++ err = link_or_create_wh(wh_dentry, sb, bindex); ++ if (!err) ++ set_dbwh(dentry, bindex); ++ else { ++ dput(wh_dentry); ++ wh_dentry = ERR_PTR(err); ++ } ++ } ++ ++ TraceErrPtr(wh_dentry); ++ return wh_dentry; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* Delete all whiteouts in this directory in branch bindex. */ ++static int del_wh_children(struct aufs_nhash *whlist, ++ struct dentry *hidden_parent, aufs_bindex_t bindex, ++ struct lkup_args *lkup) ++{ ++ int err, i; ++ struct qstr wh_name; ++ char *p; ++ struct inode *hidden_dir; ++ struct hlist_head *head; ++ struct aufs_wh *tpos; ++ struct hlist_node *pos; ++ struct aufs_destr *str; ++ ++ LKTRTrace("%.*s\n", DLNPair(hidden_parent)); ++ hidden_dir = hidden_parent->d_inode; ++ IMustLock(hidden_dir); ++ DEBUG_ON(IS_RDONLY(hidden_dir)); ++ //SiMustReadLock(??); ++ ++ err = -ENOMEM; ++ wh_name.name = p = __getname(); ++ //if (LktrCond) {__putname(p); wh_name.name = p = NULL;} ++ if (unlikely(!wh_name.name)) ++ goto out; ++ memcpy(p, AUFS_WH_PFX, AUFS_WH_PFX_LEN); ++ p += AUFS_WH_PFX_LEN; ++ ++ // already checked by au_test_perm(). ++ err = 0; ++ for (i = 0; !err && i < AUFS_NHASH_SIZE; i++) { ++ head = whlist->heads + i; ++ hlist_for_each_entry(tpos, pos, head, wh_hash) { ++ if (tpos->wh_bindex != bindex) ++ continue; ++ str = &tpos->wh_str; ++ if (str->len + AUFS_WH_PFX_LEN <= PATH_MAX) { ++ memcpy(p, str->name, str->len); ++ wh_name.len = AUFS_WH_PFX_LEN + str->len; ++ err = unlink_wh_name(hidden_parent, &wh_name, ++ lkup); ++ //if (LktrCond) err = -1; ++ if (!err) ++ continue; ++ break; ++ } ++ IOErr("whiteout name too long %.*s\n", ++ str->len, str->name); ++ err = -EIO; ++ break; ++ } ++ } ++ __putname(wh_name.name); ++ ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++struct del_wh_children_args { ++ int *errp; ++ struct aufs_nhash *whlist; ++ struct dentry *hidden_parent; ++ aufs_bindex_t bindex; ++ struct lkup_args *lkup; ++}; ++ ++static void call_del_wh_children(void *args) ++{ ++ struct del_wh_children_args *a = args; ++ *a->errp = del_wh_children(a->whlist, a->hidden_parent, a->bindex, ++ a->lkup); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * rmdir the whiteouted temporary named dir @hidden_dentry. ++ * @whlist: whiteouted children. ++ */ ++int rmdir_whtmp(struct dentry *hidden_dentry, struct aufs_nhash *whlist, ++ aufs_bindex_t bindex, struct inode *dir, struct inode *inode) ++{ ++ int err; ++ struct inode *hidden_inode, *hidden_dir; ++ struct lkup_args lkup; ++ struct super_block *sb; ++ ++ LKTRTrace("hd %.*s, b%d, i%lu\n", ++ DLNPair(hidden_dentry), bindex, dir->i_ino); ++ IMustLock(dir); ++ IiMustAnyLock(dir); ++ hidden_dir = hidden_dentry->d_parent->d_inode; ++ IMustLock(hidden_dir); ++ ++ sb = inode->i_sb; ++ lkup.nfsmnt = au_nfsmnt(sb, bindex); ++ lkup.dlgt = need_dlgt(sb); ++ hidden_inode = hidden_dentry->d_inode; ++ DEBUG_ON(hidden_inode != au_h_iptr_i(inode, bindex)); ++ hdir2_lock(hidden_inode, inode, bindex); ++ if (!au_test_perm(hidden_inode, MAY_EXEC | MAY_WRITE, lkup.dlgt)) ++ err = del_wh_children(whlist, hidden_dentry, bindex, &lkup); ++ else { ++ // ugly ++ int dlgt = lkup.dlgt; ++ struct del_wh_children_args args = { ++ .errp = &err, ++ .whlist = whlist, ++ .hidden_parent = hidden_dentry, ++ .bindex = bindex, ++ .lkup = &lkup ++ }; ++ ++ lkup.dlgt = 0; ++ au_wkq_wait(call_del_wh_children, &args, /*dlgt*/0); ++ lkup.dlgt = dlgt; ++ } ++ hdir_unlock(hidden_inode, inode, bindex); ++ ++ if (!err) { ++ err = vfsub_rmdir(hidden_dir, hidden_dentry, lkup.dlgt); ++ //d_drop(hidden_dentry); ++ //if (LktrCond) err = -1; ++ } ++ ++ if (!err) { ++ if (ibstart(dir) == bindex) { ++ au_cpup_attr_timesizes(dir); ++ //au_cpup_attr_nlink(dir); ++ dir->i_nlink--; ++ } ++ return 0; /* success */ ++ } ++ ++ Warn("failed removing %.*s(%d), ignored\n", ++ DLNPair(hidden_dentry), err); ++ return err; ++} ++ ++static void do_rmdir_whtmp(void *arg) ++{ ++ int err; ++ struct rmdir_whtmp_arg *a = arg; ++ struct super_block *sb; ++ ++ LKTRTrace("%.*s, b%d, dir i%lu\n", ++ DLNPair(a->h_dentry), a->bindex, a->dir->i_ino); ++ ++ i_lock(a->dir); ++ sb = a->dir->i_sb; ++ si_read_lock(sb); ++ err = test_ro(sb, a->bindex, NULL); ++ if (!err) { ++ struct inode *hidden_dir = a->h_dentry->d_parent->d_inode; ++ ++ ii_write_lock_child(a->inode); ++ ii_write_lock_parent(a->dir); ++ hdir_lock(hidden_dir, a->dir, a->bindex); ++ err = rmdir_whtmp(a->h_dentry, &a->whlist, a->bindex, ++ a->dir, a->inode); ++ hdir_unlock(hidden_dir, a->dir, a->bindex); ++ ii_write_unlock(a->dir); ++ ii_write_unlock(a->inode); ++ } ++ dput(a->h_dentry); ++ nhash_fin(&a->whlist); ++ iput(a->inode); ++ si_read_unlock(sb); ++ au_mntput(sb); ++ i_unlock(a->dir); ++ iput(a->dir); ++ kfree(arg); ++ if (unlikely(err)) ++ IOErr("err %d\n", err); ++} ++ ++void kick_rmdir_whtmp(struct dentry *hidden_dentry, struct aufs_nhash *whlist, ++ aufs_bindex_t bindex, struct inode *dir, ++ struct inode *inode, struct rmdir_whtmp_arg *arg) ++{ ++ LKTRTrace("%.*s\n", DLNPair(hidden_dentry)); ++ IMustLock(dir); ++ ++ // all post-process will be done in do_rmdir_whtmp(). ++ arg->h_dentry = dget(hidden_dentry); ++ nhash_init(&arg->whlist); ++ nhash_move(&arg->whlist, whlist); ++ arg->bindex = bindex; ++ arg->dir = igrab(dir); ++ arg->inode = igrab(inode); ++ /* prohibit umount */ ++ au_mntget(dir->i_sb); ++ ++ au_wkq_nowait(do_rmdir_whtmp, arg, /*dlgt*/0); ++} +diff --git a/fs/aufs/whout.h b/fs/aufs/whout.h +new file mode 100755 +index 0000000..d44c3cd +--- /dev/null ++++ b/fs/aufs/whout.h +@@ -0,0 +1,87 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: whout.h,v 1.8 2007/05/14 03:41:52 sfjro Exp $ */ ++ ++#ifndef __AUFS_WHOUT_H__ ++#define __AUFS_WHOUT_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/fs.h> ++#include <linux/aufs_type.h> ++ ++int au_alloc_whname(const char *name, int len, struct qstr *wh); ++void au_free_whname(struct qstr *wh); ++ ++struct lkup_args; ++int is_wh(struct dentry *h_parent, struct qstr *wh_name, int try_sio, ++ struct lkup_args *lkup); ++int is_diropq(struct dentry *h_dentry, struct lkup_args *lkup); ++ ++struct dentry *lkup_whtmp(struct dentry *h_parent, struct qstr *prefix, ++ struct lkup_args *lkup); ++int rename_whtmp(struct dentry *dentry, aufs_bindex_t bindex); ++int au_unlink_wh_dentry(struct inode *h_dir, struct dentry *wh_dentry, ++ struct dentry *dentry, int dlgt); ++ ++struct aufs_branch; ++int init_wh(struct dentry *h_parent, struct aufs_branch *br, ++ struct vfsmount *nfsmnt, struct super_block *sb); ++ ++struct dentry *sio_diropq(struct dentry *dentry, aufs_bindex_t bindex, ++ int do_create, int dlgt); ++ ++struct dentry *lkup_wh(struct dentry *h_parent, struct qstr *base_name, ++ struct lkup_args *lkup); ++struct dentry *simple_create_wh(struct dentry *dentry, aufs_bindex_t bindex, ++ struct dentry *h_parent, ++ struct lkup_args *lkup); ++ ++/* real rmdir the whiteout-ed dir */ ++struct rmdir_whtmp_arg { ++ struct dentry *h_dentry; ++ struct aufs_nhash whlist; ++ aufs_bindex_t bindex; ++ struct inode *dir, *inode; ++}; ++ ++struct aufs_nhash; ++int rmdir_whtmp(struct dentry *h_dentry, struct aufs_nhash *whlist, ++ aufs_bindex_t bindex, struct inode *dir, struct inode *inode); ++void kick_rmdir_whtmp(struct dentry *h_dentry, struct aufs_nhash *whlist, ++ aufs_bindex_t bindex, struct inode *dir, ++ struct inode *inode, struct rmdir_whtmp_arg *arg); ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline ++struct dentry *create_diropq(struct dentry *dentry, aufs_bindex_t bindex, ++ int dlgt) ++{ ++ return sio_diropq(dentry, bindex, 1, dlgt); ++} ++ ++static inline ++int remove_diropq(struct dentry *dentry, aufs_bindex_t bindex, int dlgt) ++{ ++ return PTR_ERR(sio_diropq(dentry, bindex, 0, dlgt)); ++} ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_WHOUT_H__ */ +diff --git a/fs/aufs/wkq.c b/fs/aufs/wkq.c +new file mode 100755 +index 0000000..b5ab023 +--- /dev/null ++++ b/fs/aufs/wkq.c +@@ -0,0 +1,283 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: wkq.c,v 1.14 2007/05/14 03:39:10 sfjro Exp $ */ ++ ++#include <linux/module.h> ++#include "aufs.h" ++ ++struct au_wkq *au_wkq; ++ ++struct au_cred { ++#ifdef CONFIG_AUFS_DLGT ++ uid_t fsuid; ++ gid_t fsgid; ++ kernel_cap_t cap_effective, cap_inheritable, cap_permitted; ++ //unsigned keep_capabilities:1; ++ //struct user_struct *user; ++ //struct fs_struct *fs; ++ //struct nsproxy *nsproxy; ++#endif ++}; ++ ++struct au_wkinfo { ++ struct work_struct wk; ++ ++ unsigned int wait:1; ++ unsigned int dlgt:1; ++ struct au_cred cred; ++ ++ au_wkq_func_t func; ++ void *args; ++ ++ atomic_t *busyp; ++ struct completion *comp; ++}; ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_DLGT ++static void cred_store(struct au_cred *cred) ++{ ++ cred->fsuid = current->fsuid; ++ cred->fsgid = current->fsgid; ++ cred->cap_effective = current->cap_effective; ++ cred->cap_inheritable = current->cap_inheritable; ++ cred->cap_permitted = current->cap_permitted; ++} ++ ++static void cred_revert(struct au_cred *cred) ++{ ++ DEBUG_ON(!is_au_wkq(current)); ++ current->fsuid = cred->fsuid; ++ current->fsgid = cred->fsgid; ++ current->cap_effective = cred->cap_effective; ++ current->cap_inheritable = cred->cap_inheritable; ++ current->cap_permitted = cred->cap_permitted; ++} ++ ++static void cred_switch(struct au_cred *old, struct au_cred *new) ++{ ++ cred_store(old); ++ cred_revert(new); ++} ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++static void update_busy(struct au_wkq *wkq, struct au_wkinfo *wkinfo) ++{ ++#ifdef CONFIG_AUFS_SYSAUFS ++ unsigned int new, old; ++ ++ do { ++ new = atomic_read(wkinfo->busyp); ++ old = wkq->max_busy; ++ if (new <= old) ++ break; ++ } while (cmpxchg(&wkq->max_busy, old, new) == old); ++#endif ++} ++ ++static int enqueue(struct au_wkq *wkq, struct au_wkinfo *wkinfo) ++{ ++ wkinfo->busyp = &wkq->busy; ++ update_busy(wkq, wkinfo); ++ if (wkinfo->wait) ++ return !queue_work(wkq->q, &wkinfo->wk); ++ else ++ return !schedule_work(&wkinfo->wk); ++} ++ ++static void do_wkq(struct au_wkinfo *wkinfo) ++{ ++ unsigned int idle, n; ++ int i, idle_idx; ++ ++ TraceEnter(); ++ ++ while (1) { ++ if (wkinfo->wait) { ++ idle_idx = 0; ++ idle = UINT_MAX; ++ for (i = 0; i < aufs_nwkq; i++) { ++ n = atomic_inc_return(&au_wkq[i].busy); ++ if (n == 1 && !enqueue(au_wkq + i, wkinfo)) ++ return; /* success */ ++ ++ if (n < idle) { ++ idle_idx = i; ++ idle = n; ++ } ++ atomic_dec(&au_wkq[i].busy); ++ } ++ } else ++ idle_idx = aufs_nwkq; ++ ++ atomic_inc(&au_wkq[idle_idx].busy); ++ if (!enqueue(au_wkq + idle_idx, wkinfo)) ++ return; /* success */ ++ ++ /* impossible? */ ++ Warn1("failed to queue_work()\n"); ++ yield(); ++ } ++} ++ ++static AuWkqFunc(wkq_func, wk) ++{ ++ struct au_wkinfo *wkinfo = container_of(wk, struct au_wkinfo, wk); ++ ++ LKTRTrace("wkinfo{%u, %u, %p, %p, %p}\n", ++ wkinfo->wait, wkinfo->dlgt, wkinfo->func, wkinfo->busyp, ++ wkinfo->comp); ++#ifdef CONFIG_AUFS_DLGT ++ if (!wkinfo->dlgt) ++ wkinfo->func(wkinfo->args); ++ else { ++ struct au_cred cred; ++ cred_switch(&cred, &wkinfo->cred); ++ wkinfo->func(wkinfo->args); ++ cred_revert(&cred); ++ } ++#else ++ wkinfo->func(wkinfo->args); ++#endif ++ atomic_dec(wkinfo->busyp); ++ if (wkinfo->wait) ++ complete(wkinfo->comp); ++ else { ++ kfree(wkinfo); ++ module_put(THIS_MODULE); ++ } ++} ++ ++void au_wkq_run(au_wkq_func_t func, void *args, int dlgt, int do_wait) ++{ ++ DECLARE_COMPLETION_ONSTACK(comp); ++ struct au_wkinfo _wkinfo = { ++ .wait = 1, ++ .dlgt = !!dlgt, ++ .func = func, ++ .args = args, ++ .comp = &comp ++ }, *wkinfo = &_wkinfo; ++ ++ LKTRTrace("dlgt %d, do_wait %d\n", dlgt, do_wait); ++ DEBUG_ON(is_au_wkq(current)); ++ ++ if (unlikely(!do_wait)) { ++ static DECLARE_WAIT_QUEUE_HEAD(wq); ++ /* ++ * never fail. ++ * wkq_func() must free this wkinfo. ++ * it highly depends upon the implementation of workqueue. ++ */ ++ wait_event(wq, (wkinfo = kmalloc(sizeof(*wkinfo), GFP_KERNEL))); ++ wkinfo->wait = 0; ++ wkinfo->dlgt = !!dlgt; ++ wkinfo->func = func; ++ wkinfo->args = args; ++ wkinfo->comp = NULL; ++ __module_get(THIS_MODULE); ++ } ++ ++ AuInitWkq(&wkinfo->wk, wkq_func); ++#ifdef CONFIG_AUFS_DLGT ++ if (dlgt) ++ cred_store(&wkinfo->cred); ++#endif ++ do_wkq(wkinfo); ++ if (do_wait) ++ wait_for_completion(wkinfo->comp); ++} ++ ++#if 0 ++void au_wkq_wait_nwtask(void) ++{ ++ static DECLARE_WAIT_QUEUE_HEAD(wq); ++ wait_event(wq, !atomic_read(&au_wkq[aufs_nwkq].busy)); ++} ++#endif ++ ++void au_wkq_fin(void) ++{ ++ int i; ++ ++ TraceEnter(); ++ ++ for (i = 0; i < aufs_nwkq; i++) ++ if (au_wkq[i].q && !IS_ERR(au_wkq[i].q)) ++ destroy_workqueue(au_wkq[i].q); ++ kfree(au_wkq); ++} ++ ++int __init au_wkq_init(void) ++{ ++ int err, i; ++ struct au_wkq *nowaitq; ++ ++ LKTRTrace("%d\n", aufs_nwkq); ++ ++ /* '+1' is for accounting of nowait queue */ ++ err = -ENOMEM; ++ au_wkq = kcalloc(aufs_nwkq + 1, sizeof(*au_wkq), GFP_KERNEL); ++ if (unlikely(!au_wkq)) ++ goto out; ++ ++ err = 0; ++ for (i = 0; i < aufs_nwkq; i++) { ++ au_wkq[i].q = create_singlethread_workqueue(AUFS_WKQ_NAME); ++ if (au_wkq[i].q && !IS_ERR(au_wkq[i].q)) { ++ atomic_set(&au_wkq[i].busy, 0); ++ au_wkq[i].max_busy = 0; ++ continue; ++ } ++ ++ err = PTR_ERR(au_wkq[i].q); ++ au_wkq_fin(); ++ break; ++ } ++ ++ /* nowait accounting */ ++ nowaitq = au_wkq + aufs_nwkq; ++ atomic_set(&nowaitq->busy, 0); ++ nowaitq->max_busy = 0; ++ nowaitq->q = NULL; ++ ++#if 0 // test accouting ++ if (!err) { ++ static void f(void *args) { ++ DbgSleep(1); ++ } ++ int i; ++ //au_debug_on(); ++ LKTRTrace("f %p\n", f); ++ for (i = 0; i < 10; i++) ++ au_wkq_nowait(f, NULL, 0); ++ for (i = 0; i < aufs_nwkq; i++) ++ au_wkq_wait(f, NULL, 0); ++ DbgSleep(11); ++ //au_debug_off(); ++ } ++#endif ++ ++ out: ++ TraceErr(err); ++ return err; ++} +diff --git a/fs/aufs/wkq.h b/fs/aufs/wkq.h +new file mode 100755 +index 0000000..cc1bb25 +--- /dev/null ++++ b/fs/aufs/wkq.h +@@ -0,0 +1,81 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: wkq.h,v 1.9 2007/05/14 03:39:10 sfjro Exp $ */ ++ ++#ifndef __AUFS_WKQ_H__ ++#define __AUFS_WKQ_H__ ++ ++#ifdef __KERNEL__ ++ ++#include <linux/sched.h> ++#include <linux/version.h> ++#include <linux/workqueue.h> ++ ++#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,18) ++#define DECLARE_COMPLETION_ONSTACK(work) DECLARE_COMPLETION(work) ++#endif ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* internal workqueue named AUFS_WKQ_NAME */ ++struct au_wkq { ++ struct workqueue_struct *q; ++ ++ /* accounting */ ++ atomic_t busy; ++ unsigned int max_busy; ++} ;//__attribute__ ((aligned)); ++ ++typedef void (*au_wkq_func_t)(void *args); ++ ++#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20) ++#define AuInitWkq(wk, func) INIT_WORK(wk, func) ++#define AuWkqFunc(name, arg) void name(struct work_struct *arg) ++#else ++typedef void (*work_func_t)(void *arg); ++#define AuInitWkq(wk, func) INIT_WORK(wk, func, wk) ++#define AuWkqFunc(name, arg) void name(void *arg) ++#endif ++ ++extern struct au_wkq *au_wkq; ++ ++void au_wkq_run(au_wkq_func_t func, void *args, int dlgt, int do_wait); ++//void au_wkq_wait_nwtask(void); ++int __init au_wkq_init(void); ++void au_wkq_fin(void); ++ ++/* ---------------------------------------------------------------------- */ ++ ++static inline int is_au_wkq(struct task_struct *tsk) ++{ ++ return (!tsk->mm && !strcmp(current->comm, AUFS_WKQ_NAME)); ++} ++ ++static inline void au_wkq_wait(au_wkq_func_t func, void *args, int dlgt) ++{ ++ au_wkq_run(func, args, dlgt, /*do_wait*/1); ++} ++ ++static inline void au_wkq_nowait(au_wkq_func_t func, void *args, int dlgt) ++{ ++ au_wkq_run(func, args, dlgt, /*do_wait*/0); ++} ++ ++#endif /* __KERNEL__ */ ++#endif /* __AUFS_WKQ_H__ */ +diff --git a/fs/aufs/xino.c b/fs/aufs/xino.c +new file mode 100755 +index 0000000..145491e +--- /dev/null ++++ b/fs/aufs/xino.c +@@ -0,0 +1,644 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: xino.c,v 1.27 2007/05/14 03:39:10 sfjro Exp $ */ ++ ++//#include <linux/fs.h> ++#include <linux/fsnotify.h> ++#include <asm/uaccess.h> ++#include "aufs.h" ++ ++static readf_t find_readf(struct file *h_file) ++{ ++ const struct file_operations *fop = h_file->f_op; ++ ++ if (fop) { ++ if (fop->read) ++ return fop->read; ++ if (fop->aio_read) ++ return do_sync_read; ++ } ++ return ERR_PTR(-ENOSYS); ++} ++ ++static writef_t find_writef(struct file *h_file) ++{ ++ const struct file_operations *fop = h_file->f_op; ++ ++ if (fop) { ++ if (fop->write) ++ return fop->write; ++ if (fop->aio_write) ++ return do_sync_write; ++ } ++ return ERR_PTR(-ENOSYS); ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static ssize_t xino_fread(readf_t func, struct file *file, void *buf, ++ size_t size, loff_t *pos) ++{ ++ ssize_t err; ++ mm_segment_t oldfs; ++ ++ LKTRTrace("%.*s, sz %lu, *pos %Ld\n", ++ DLNPair(file->f_dentry), (unsigned long)size, *pos); ++ ++ oldfs = get_fs(); ++ set_fs(KERNEL_DS); ++ do { ++ err = func(file, (char __user*)buf, size, pos); ++ } while (err == -EAGAIN || err == -EINTR); ++ set_fs(oldfs); ++ ++#if 0 ++ if (err > 0) ++ fsnotify_access(file->f_dentry); ++#endif ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++static ssize_t do_xino_fwrite(writef_t func, struct file *file, void *buf, ++ size_t size, loff_t *pos) ++{ ++ ssize_t err; ++ mm_segment_t oldfs; ++ ++ lockdep_off(); ++ oldfs = get_fs(); ++ set_fs(KERNEL_DS); ++ do { ++ err = func(file, (const char __user*)buf, size, pos); ++ } while (err == -EAGAIN || err == -EINTR); ++ set_fs(oldfs); ++ lockdep_on(); ++ ++#if 0 ++ if (err > 0) ++ fsnotify_modify(file->f_dentry); ++#endif ++ ++ TraceErr(err); ++ return err; ++} ++ ++struct do_xino_fwrite_args { ++ ssize_t *errp; ++ writef_t func; ++ struct file *file; ++ void *buf; ++ size_t size; ++ loff_t *pos; ++}; ++ ++static void call_do_xino_fwrite(void *args) ++{ ++ struct do_xino_fwrite_args *a = args; ++ *a->errp = do_xino_fwrite(a->func, a->file, a->buf, a->size, a->pos); ++} ++ ++static ssize_t xino_fwrite(writef_t func, struct file *file, void *buf, ++ size_t size, loff_t *pos) ++{ ++ ssize_t err; ++ ++ LKTRTrace("%.*s, sz %lu, *pos %Ld\n", ++ DLNPair(file->f_dentry), (unsigned long)size, *pos); ++ ++ // signal block and no wkq? ++ /* ++ * it breaks RLIMIT_FSIZE and normal user's limit, ++ * users should care about quota and real 'filesystem full.' ++ */ ++ if (!is_au_wkq(current)) { ++ struct do_xino_fwrite_args args = { ++ .errp = &err, ++ .func = func, ++ .file = file, ++ .buf = buf, ++ .size = size, ++ .pos = pos ++ }; ++ au_wkq_wait(call_do_xino_fwrite, &args, /*dlgt*/0); ++ } else ++ err = do_xino_fwrite(func, file, buf, size, pos); ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ++ * write @ino to the xinofile for the specified branch{@sb, @bindex} ++ * at the position of @_ino. ++ * when @ino is zero, it is written to the xinofile and means no entry. ++ */ ++int xino_write(struct super_block *sb, aufs_bindex_t bindex, ino_t h_ino, ++ struct xino *xino) ++{ ++ struct aufs_branch *br; ++ loff_t pos; ++ ssize_t sz; ++ ++ LKTRTrace("b%d, hi%lu, i%lu\n", bindex, h_ino, xino->ino); ++ //DEBUG_ON(!xino->ino /* || !xino->h_gen */); ++ //WARN_ON(bindex == 0 && h_ino == 31); ++ ++ if (unlikely(!au_flag_test(sb, AuFlag_XINO))) ++ return 0; ++ ++ br = stobr(sb, bindex); ++ DEBUG_ON(!br || !br->br_xino); ++ pos = h_ino * sizeof(*xino); ++ sz = xino_fwrite(br->br_xino_write, br->br_xino, xino, sizeof(*xino), ++ &pos); ++ //if (LktrCond) sz = 1; ++ if (sz == sizeof(*xino)) ++ return 0; /* success */ ++ ++ IOErr("write failed (%ld)\n", (long)sz); ++ return -EIO; ++} ++ ++int xino_write0(struct super_block *sb, aufs_bindex_t bindex, ino_t h_ino) ++{ ++ struct xino xino = { ++ .ino = 0 ++ }; ++ return xino_write(sb, bindex, h_ino, &xino); ++} ++ ++// why is not atomic_long_inc_return defined? ++static DEFINE_SPINLOCK(alir_lock); ++static long atomic_long_inc_return(atomic_long_t *a) ++{ ++ long l; ++ ++ spin_lock(&alir_lock); ++ atomic_long_inc(a); ++ l = atomic_long_read(a); ++ spin_unlock(&alir_lock); ++ return l; ++} ++ ++ino_t xino_new_ino(struct super_block *sb) ++{ ++ ino_t ino; ++ ++ TraceEnter(); ++ ino = atomic_long_inc_return(&stosi(sb)->si_xino); ++ BUILD_BUG_ON(AUFS_FIRST_INO < AUFS_ROOT_INO); ++ if (ino >= AUFS_ROOT_INO) ++ return ino; ++ else { ++ atomic_long_dec(&stosi(sb)->si_xino); ++ IOErr1("inode number overflow\n"); ++ return 0; ++ } ++} ++ ++/* ++ * read @ino from xinofile for the specified branch{@sb, @bindex} ++ * at the position of @h_ino. ++ * if @ino does not exist and @do_new is true, get new one. ++ */ ++int xino_read(struct super_block *sb, aufs_bindex_t bindex, ino_t h_ino, ++ struct xino *xino) ++{ ++ int err; ++ struct aufs_branch *br; ++ struct file *file; ++ loff_t pos; ++ ssize_t sz; ++ ++ LKTRTrace("b%d, hi%lu\n", bindex, h_ino); ++ ++ err = 0; ++ xino->ino = 0; ++ if (unlikely(!au_flag_test(sb, AuFlag_XINO))) ++ return 0; /* no ino */ ++ ++ br = stobr(sb, bindex); ++ file = br->br_xino; ++ DEBUG_ON(!file); ++ pos = h_ino * sizeof(*xino); ++ if (i_size_read(file->f_dentry->d_inode) < pos + sizeof(*xino)) ++ return 0; /* no ino */ ++ ++ sz = xino_fread(br->br_xino_read, file, xino, sizeof(*xino), &pos); ++ if (sz == sizeof(*xino)) ++ return 0; /* success */ ++ ++ err = sz; ++ if (unlikely(sz >= 0)) { ++ err = -EIO; ++ IOErr("xino read error (%ld)\n", (long)sz); ++ } ++ ++ TraceErr(err); ++ return err; ++} ++ ++/* ---------------------------------------------------------------------- */ ++ ++struct file *xino_create(struct super_block *sb, char *fname, int silent, ++ struct dentry *parent) ++{ ++ struct file *file; ++ int err; ++ struct dentry *hidden_parent; ++ struct inode *hidden_dir; ++ //const int udba = au_flag_test(sb, AuFlag_UDBA_INOTIFY); ++ ++ LKTRTrace("%s\n", fname); ++ //DEBUG_ON(!au_flag_test(sb, AuFlag_XINO)); ++ ++ // LSM may detect it ++ // use sio? ++ file = vfsub_filp_open(fname, O_RDWR | O_CREAT | O_EXCL | O_LARGEFILE, ++ S_IRUGO | S_IWUGO); ++ //file = ERR_PTR(-1); ++ if (IS_ERR(file)) { ++ if (!silent) ++ Err("open %s(%ld)\n", fname, PTR_ERR(file)); ++ return file; ++ } ++#if 0 ++ if (unlikely(udba && parent)) ++ au_direval_dec(parent); ++#endif ++ ++ /* keep file count */ ++ hidden_parent = dget_parent(file->f_dentry); ++ hidden_dir = hidden_parent->d_inode; ++ hi_lock_parent(hidden_dir); ++ err = vfsub_unlink(hidden_dir, file->f_dentry, /*dlgt*/0); ++#if 0 ++ if (unlikely(!err && udba && parent)) ++ au_direval_dec(parent); ++#endif ++ i_unlock(hidden_dir); ++ dput(hidden_parent); ++ if (unlikely(err)) { ++ if (!silent) ++ Err("unlink %s(%d)\n", fname, err); ++ goto out; ++ } ++ if (sb != file->f_dentry->d_sb) ++ return file; /* success */ ++ ++ if (!silent) ++ Err("%s must be outside\n", fname); ++ err = -EINVAL; ++ ++ out: ++ fput(file); ++ file = ERR_PTR(err); ++ return file; ++} ++ ++/* ++ * find another branch who is on the same filesystem of the specified ++ * branch{@btgt}. search until @bend. ++ */ ++static int is_sb_shared(struct super_block *sb, aufs_bindex_t btgt, ++ aufs_bindex_t bend) ++{ ++ aufs_bindex_t bindex; ++ struct super_block *tgt_sb = sbr_sb(sb, btgt); ++ ++ for (bindex = 0; bindex <= bend; bindex++) ++ if (unlikely(btgt != bindex && tgt_sb == sbr_sb(sb, bindex))) ++ return bindex; ++ return -1; ++} ++ ++/* ++ * create a new xinofile at the same place/path as @base_file. ++ */ ++static struct file *xino_create2(struct file *base_file) ++{ ++ struct file *file; ++ int err; ++ struct dentry *base, *dentry, *parent; ++ struct inode *dir; ++ struct qstr *name; ++ struct lkup_args lkup = { ++ .nfsmnt = NULL, ++ .dlgt = 0 ++ }; ++ ++ base = base_file->f_dentry; ++ LKTRTrace("%.*s\n", DLNPair(base)); ++ parent = dget_parent(base); ++ dir = parent->d_inode; ++ IMustLock(dir); ++ ++ file = ERR_PTR(-EINVAL); ++ if (unlikely(au_is_nfs(parent->d_sb))) ++ goto out; ++ ++ // do not superio, nor NFS. ++ name = &base->d_name; ++ dentry = lkup_one(name->name, parent, name->len, &lkup); ++ //if (LktrCond) {dput(dentry); dentry = ERR_PTR(-1);} ++ if (IS_ERR(dentry)) { ++ file = (void*)dentry; ++ Err("%.*s lookup err %ld\n", LNPair(name), PTR_ERR(dentry)); ++ goto out; ++ } ++ err = vfsub_create(dir, dentry, S_IRUGO | S_IWUGO, NULL, /*dlgt*/0); ++ //if (LktrCond) {vfs_unlink(dir, dentry); err = -1;} ++ if (unlikely(err)) { ++ file = ERR_PTR(err); ++ Err("%.*s create err %d\n", LNPair(name), err); ++ goto out_dput; ++ } ++ file = dentry_open(dget(dentry), mntget(base_file->f_vfsmnt), ++ O_RDWR | O_CREAT | O_EXCL | O_LARGEFILE); ++ //if (LktrCond) {fput(file); file = ERR_PTR(-1);} ++ if (IS_ERR(file)) { ++ Err("%.*s open err %ld\n", LNPair(name), PTR_ERR(file)); ++ goto out_dput; ++ } ++ err = vfsub_unlink(dir, dentry, /*dlgt*/0); ++ //if (LktrCond) err = -1; ++ if (!err) ++ goto out_dput; /* success */ ++ ++ Err("%.*s unlink err %d\n", LNPair(name), err); ++ fput(file); ++ file = ERR_PTR(err); ++ ++ out_dput: ++ dput(dentry); ++ out: ++ dput(parent); ++ TraceErrPtr(file); ++ return file; ++} ++ ++/* ++ * initialize the xinofile for the specified branch{@sb, @bindex} ++ * at the place/path where @base_file indicates. ++ * test whether another branch is on the same filesystem or not, ++ * if @do_test is true. ++ */ ++int xino_init(struct super_block *sb, aufs_bindex_t bindex, ++ struct file *base_file, int do_test) ++{ ++ int err; ++ struct aufs_branch *br; ++ aufs_bindex_t bshared, bend; ++ struct file *file; ++ struct inode *inode, *hidden_inode; ++ struct xino xino; ++ ++ LKTRTrace("b%d, base_file %p, do_test %d\n", ++ bindex, base_file, do_test); ++ SiMustWriteLock(sb); ++ DEBUG_ON(!au_flag_test(sb, AuFlag_XINO)); ++ br = stobr(sb, bindex); ++ DEBUG_ON(br->br_xino); ++ ++ file = NULL; ++ bshared = -1; ++ bend = sbend(sb); ++ if (do_test) ++ bshared = is_sb_shared(sb, bindex, bend); ++ if (unlikely(bshared >= 0)) { ++ struct aufs_branch *shared_br = stobr(sb, bshared); ++ if (shared_br->br_xino) { ++ file = shared_br->br_xino; ++ get_file(file); ++ } ++ } ++ ++ if (!file) { ++ struct dentry *parent = dget_parent(base_file->f_dentry); ++ struct inode *dir = parent->d_inode; ++ ++ hi_lock_parent(dir); ++ file = xino_create2(base_file); ++ //if (LktrCond) {fput(file); file = ERR_PTR(-1);} ++ i_unlock(dir); ++ dput(parent); ++ err = PTR_ERR(file); ++ if (IS_ERR(file)) ++ goto out; ++ } ++ br->br_xino_read = find_readf(file); ++ err = PTR_ERR(br->br_xino_read); ++ if (IS_ERR(br->br_xino_read)) ++ goto out_put; ++ br->br_xino_write = find_writef(file); ++ err = PTR_ERR(br->br_xino_write); ++ if (IS_ERR(br->br_xino_write)) ++ goto out_put; ++ br->br_xino = file; ++ ++ inode = sb->s_root->d_inode; ++ hidden_inode = au_h_iptr_i(inode, bindex); ++ xino.ino = inode->i_ino; ++ //xino.h_gen = hidden_inode->i_generation; ++ //WARN_ON(xino.h_gen == AuXino_INVALID_HGEN); ++ err = xino_write(sb, bindex, hidden_inode->i_ino, &xino); ++ //if (LktrCond) err = -1; ++ if (!err) ++ return 0; /* success */ ++ ++ br->br_xino = NULL; ++ ++ out_put: ++ fput(file); ++ out: ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * set xino mount option. ++ */ ++int xino_set(struct super_block *sb, struct opt_xino *xino, int remount) ++{ ++ int err, sparse; ++ aufs_bindex_t bindex, bend; ++ struct aufs_branch *br; ++ struct dentry *parent; ++ struct qstr *name; ++ struct file *cur_xino; ++ struct inode *dir; ++ ++ LKTRTrace("%s\n", xino->path); ++ ++ err = 0; ++ name = &xino->file->f_dentry->d_name; ++ parent = dget_parent(xino->file->f_dentry); ++ dir = parent->d_inode; ++ cur_xino = stobr(sb, 0)->br_xino; ++ if (remount ++ && cur_xino ++ && cur_xino->f_dentry->d_parent == parent ++ && name->len == cur_xino->f_dentry->d_name.len ++ && !memcmp(name->name, cur_xino->f_dentry->d_name.name, name->len)) ++ goto out; ++ ++ au_flag_set(sb, AuFlag_XINO); ++ bend = sbend(sb); ++ for (bindex = bend; bindex >= 0; bindex--) { ++ br = stobr(sb, bindex); ++ if (unlikely(br->br_xino && file_count(br->br_xino) > 1)) { ++ fput(br->br_xino); ++ br->br_xino = NULL; ++ } ++ } ++ ++ for (bindex = 0; bindex <= bend; bindex++) { ++ struct file *file; ++ struct inode *inode; ++ ++ br = stobr(sb, bindex); ++ if (unlikely(!br->br_xino)) ++ continue; ++ ++ DEBUG_ON(file_count(br->br_xino) != 1); ++ hi_lock_parent(dir); ++ file = xino_create2(xino->file); ++ //if (LktrCond) {fput(file); file = ERR_PTR(-1);} ++ err = PTR_ERR(file); ++ if (IS_ERR(file)) { ++ i_unlock(dir); ++ break; ++ } ++ inode = br->br_xino->f_dentry->d_inode; ++ err = au_copy_file(file, br->br_xino, i_size_read(inode), sb, ++ &sparse); ++ //if (LktrCond) err = -1; ++ i_unlock(dir); ++ if (unlikely(err)) { ++ fput(file); ++ break; ++ } ++ fput(br->br_xino); ++ br->br_xino = file; ++ br->br_xino_read = find_readf(file); ++ DEBUG_ON(IS_ERR(br->br_xino_read)); ++ br->br_xino_write = find_writef(file); ++ DEBUG_ON(IS_ERR(br->br_xino_write)); ++ } ++ ++ for (bindex = 0; bindex <= bend; bindex++) ++ if (unlikely(!stobr(sb, bindex)->br_xino)) { ++ err = xino_init(sb, bindex, xino->file, /*do_test*/1); ++ //if (LktrCond) {fput(stobr(sb, bindex)->br_xino); ++ //stobr(sb, bindex)->br_xino = NULL; err = -1;} ++ if (!err) ++ continue; ++ IOErr("creating xino for branch %d(%d), " ++ "forcing noxino\n", bindex, err); ++ err = -EIO; ++ break; ++ } ++ out: ++ dput(parent); ++ if (!err) ++ au_flag_set(sb, AuFlag_XINO); ++ else ++ au_flag_clr(sb, AuFlag_XINO); ++ TraceErr(err); ++ return err; ++} ++ ++/* ++ * clear xino mount option ++ */ ++int xino_clr(struct super_block *sb) ++{ ++ aufs_bindex_t bindex, bend; ++ ++ TraceEnter(); ++ SiMustWriteLock(sb); ++ ++ bend = sbend(sb); ++ for (bindex = 0; bindex <= bend; bindex++) { ++ struct aufs_branch *br; ++ br = stobr(sb, bindex); ++ if (br->br_xino) { ++ fput(br->br_xino); ++ br->br_xino = NULL; ++ } ++ } ++ ++ //todo: need to make iunique() to return the larger inode number ++ ++ au_flag_clr(sb, AuFlag_XINO); ++ return 0; ++} ++ ++/* ++ * create a xinofile at the default place/path. ++ */ ++struct file *xino_def(struct super_block *sb) ++{ ++ struct file *file; ++ aufs_bindex_t bend, bindex, bwr; ++ char *page, *p; ++ ++ bend = sbend(sb); ++ bwr = -1; ++ for (bindex = 0; bindex <= bend; bindex++) ++ if (br_writable(sbr_perm(sb, bindex)) ++ && !au_is_nfs(au_h_dptr_i(sb->s_root, bindex)->d_sb)) { ++ bwr = bindex; ++ break; ++ } ++ ++ if (bwr != -1) { ++ // todo: rewrite with lkup_one() ++ file = ERR_PTR(-ENOMEM); ++ page = __getname(); ++ //if (LktrCond) {__putname(page); page = NULL;} ++ if (unlikely(!page)) ++ goto out; ++ p = d_path(au_h_dptr_i(sb->s_root, bwr), sbr_mnt(sb, bwr), page, ++ PATH_MAX - sizeof(AUFS_XINO_FNAME)); ++ //if (LktrCond) p = ERR_PTR(-1); ++ file = (void*)p; ++ if (p && !IS_ERR(p)) { ++ strcat(p, "/" AUFS_XINO_FNAME); ++ LKTRTrace("%s\n", p); ++ file = xino_create(sb, p, /*silent*/0, sb->s_root); ++ //if (LktrCond) {fput(file); file = ERR_PTR(-1);} ++ } ++ __putname(page); ++ } else { ++ file = xino_create(sb, AUFS_XINO_DEFPATH, /*silent*/0, ++ /*parent*/NULL); ++ //if (LktrCond) {fput(file); file = ERR_PTR(-1);} ++ } ++ ++ out: ++ TraceErrPtr(file); ++ return file; ++} +diff --git a/fs/squashfs/Makefile b/fs/squashfs/Makefile +new file mode 100644 +index 0000000..1bc7b06 +--- /dev/null ++++ b/fs/squashfs/Makefile +@@ -0,0 +1,7 @@ ++# ++# Makefile for the linux squashfs routines. ++# ++ ++obj-$(CONFIG_SQUASHFS) += squashfs.o ++squashfs-y += inode.o ++squashfs-y += squashfs2_0.o +diff --git a/fs/squashfs/inode.c b/fs/squashfs/inode.c +new file mode 100644 +index 0000000..895b699 +--- /dev/null ++++ b/fs/squashfs/inode.c +@@ -0,0 +1,2329 @@ ++/* ++ * Squashfs - a compressed read only filesystem for Linux ++ * ++ * Copyright (c) 2002, 2003, 2004, 2005, 2006, 2007 ++ * Phillip Lougher <phillip@lougher.org.uk> ++ * ++ * This program is free software; you can redistribute it and/or ++ * modify it under the terms of the GNU General Public License ++ * as published by the Free Software Foundation; either version 2, ++ * or (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ++ * ++ * inode.c ++ */ ++ ++#include <linux/squashfs_fs.h> ++#include <linux/module.h> ++#include <linux/zlib.h> ++#include <linux/fs.h> ++#include <linux/squashfs_fs_sb.h> ++#include <linux/squashfs_fs_i.h> ++#include <linux/buffer_head.h> ++#include <linux/vfs.h> ++#include <linux/vmalloc.h> ++#include <linux/smp_lock.h> ++ ++#include "squashfs.h" ++ ++static void vfs_read_inode(struct inode *i); ++static struct dentry *squashfs_get_parent(struct dentry *child); ++static int squashfs_read_inode(struct inode *i, squashfs_inode_t inode); ++static int squashfs_statfs(struct dentry *, struct kstatfs *); ++static int squashfs_symlink_readpage(struct file *file, struct page *page); ++static long long read_blocklist(struct inode *inode, int index, ++ int readahead_blks, char *block_list, ++ unsigned short **block_p, unsigned int *bsize); ++static int squashfs_readpage(struct file *file, struct page *page); ++static int squashfs_readpage4K(struct file *file, struct page *page); ++static int squashfs_readdir(struct file *, void *, filldir_t); ++static struct dentry *squashfs_lookup(struct inode *, struct dentry *, ++ struct nameidata *); ++static int squashfs_remount(struct super_block *s, int *flags, char *data); ++static void squashfs_put_super(struct super_block *); ++static int squashfs_get_sb(struct file_system_type *,int, const char *, void *, ++ struct vfsmount *); ++static struct inode *squashfs_alloc_inode(struct super_block *sb); ++static void squashfs_destroy_inode(struct inode *inode); ++static int init_inodecache(void); ++static void destroy_inodecache(void); ++ ++static struct file_system_type squashfs_fs_type = { ++ .owner = THIS_MODULE, ++ .name = "squashfs", ++ .get_sb = squashfs_get_sb, ++ .kill_sb = kill_block_super, ++ .fs_flags = FS_REQUIRES_DEV ++}; ++ ++static const unsigned char squashfs_filetype_table[] = { ++ DT_UNKNOWN, DT_DIR, DT_REG, DT_LNK, DT_BLK, DT_CHR, DT_FIFO, DT_SOCK ++}; ++ ++static struct super_operations squashfs_super_ops = { ++ .alloc_inode = squashfs_alloc_inode, ++ .destroy_inode = squashfs_destroy_inode, ++ .statfs = squashfs_statfs, ++ .put_super = squashfs_put_super, ++ .remount_fs = squashfs_remount ++}; ++ ++static struct super_operations squashfs_export_super_ops = { ++ .alloc_inode = squashfs_alloc_inode, ++ .destroy_inode = squashfs_destroy_inode, ++ .statfs = squashfs_statfs, ++ .put_super = squashfs_put_super, ++ .read_inode = vfs_read_inode ++}; ++ ++static struct export_operations squashfs_export_ops = { ++ .get_parent = squashfs_get_parent ++}; ++ ++SQSH_EXTERN const struct address_space_operations squashfs_symlink_aops = { ++ .readpage = squashfs_symlink_readpage ++}; ++ ++SQSH_EXTERN const struct address_space_operations squashfs_aops = { ++ .readpage = squashfs_readpage ++}; ++ ++SQSH_EXTERN const struct address_space_operations squashfs_aops_4K = { ++ .readpage = squashfs_readpage4K ++}; ++ ++static const struct file_operations squashfs_dir_ops = { ++ .read = generic_read_dir, ++ .readdir = squashfs_readdir ++}; ++ ++SQSH_EXTERN struct inode_operations squashfs_dir_inode_ops = { ++ .lookup = squashfs_lookup ++}; ++ ++ ++static struct buffer_head *get_block_length(struct super_block *s, ++ int *cur_index, int *offset, int *c_byte) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ unsigned short temp; ++ struct buffer_head *bh; ++ ++ if (!(bh = sb_bread(s, *cur_index))) ++ goto out; ++ ++ if (msblk->devblksize - *offset == 1) { ++ if (msblk->swap) ++ ((unsigned char *) &temp)[1] = *((unsigned char *) ++ (bh->b_data + *offset)); ++ else ++ ((unsigned char *) &temp)[0] = *((unsigned char *) ++ (bh->b_data + *offset)); ++ brelse(bh); ++ if (!(bh = sb_bread(s, ++(*cur_index)))) ++ goto out; ++ if (msblk->swap) ++ ((unsigned char *) &temp)[0] = *((unsigned char *) ++ bh->b_data); ++ else ++ ((unsigned char *) &temp)[1] = *((unsigned char *) ++ bh->b_data); ++ *c_byte = temp; ++ *offset = 1; ++ } else { ++ if (msblk->swap) { ++ ((unsigned char *) &temp)[1] = *((unsigned char *) ++ (bh->b_data + *offset)); ++ ((unsigned char *) &temp)[0] = *((unsigned char *) ++ (bh->b_data + *offset + 1)); ++ } else { ++ ((unsigned char *) &temp)[0] = *((unsigned char *) ++ (bh->b_data + *offset)); ++ ((unsigned char *) &temp)[1] = *((unsigned char *) ++ (bh->b_data + *offset + 1)); ++ } ++ *c_byte = temp; ++ *offset += 2; ++ } ++ ++ if (SQUASHFS_CHECK_DATA(msblk->sblk.flags)) { ++ if (*offset == msblk->devblksize) { ++ brelse(bh); ++ if (!(bh = sb_bread(s, ++(*cur_index)))) ++ goto out; ++ *offset = 0; ++ } ++ if (*((unsigned char *) (bh->b_data + *offset)) != ++ SQUASHFS_MARKER_BYTE) { ++ ERROR("Metadata block marker corrupt @ %x\n", ++ *cur_index); ++ brelse(bh); ++ goto out; ++ } ++ (*offset)++; ++ } ++ return bh; ++ ++out: ++ return NULL; ++} ++ ++ ++SQSH_EXTERN unsigned int squashfs_read_data(struct super_block *s, char *buffer, ++ long long index, unsigned int length, ++ long long *next_index, int srclength) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ struct buffer_head *bh[((SQUASHFS_FILE_MAX_SIZE - 1) >> ++ msblk->devblksize_log2) + 2]; ++ unsigned int offset = index & ((1 << msblk->devblksize_log2) - 1); ++ unsigned int cur_index = index >> msblk->devblksize_log2; ++ int bytes, avail_bytes, b = 0, k = 0; ++ unsigned int compressed; ++ unsigned int c_byte = length; ++ ++ if (c_byte) { ++ bytes = msblk->devblksize - offset; ++ compressed = SQUASHFS_COMPRESSED_BLOCK(c_byte); ++ c_byte = SQUASHFS_COMPRESSED_SIZE_BLOCK(c_byte); ++ ++ TRACE("Block @ 0x%llx, %scompressed size %d, src size %d\n", index, compressed ++ ? "" : "un", (unsigned int) c_byte, srclength); ++ ++ if (c_byte > srclength || index < 0 || (index + c_byte) > sblk->bytes_used) ++ goto read_failure; ++ ++ if (!(bh[0] = sb_getblk(s, cur_index))) ++ goto block_release; ++ ++ for (b = 1; bytes < c_byte; b++) { ++ if (!(bh[b] = sb_getblk(s, ++cur_index))) ++ goto block_release; ++ bytes += msblk->devblksize; ++ } ++ ll_rw_block(READ, b, bh); ++ } else { ++ if (index < 0 || (index + 2) > sblk->bytes_used) ++ goto read_failure; ++ ++ if (!(bh[0] = get_block_length(s, &cur_index, &offset, ++ &c_byte))) ++ goto read_failure; ++ ++ bytes = msblk->devblksize - offset; ++ compressed = SQUASHFS_COMPRESSED(c_byte); ++ c_byte = SQUASHFS_COMPRESSED_SIZE(c_byte); ++ ++ TRACE("Block @ 0x%llx, %scompressed size %d\n", index, compressed ++ ? "" : "un", (unsigned int) c_byte); ++ ++ if (c_byte > srclength || (index + c_byte) > sblk->bytes_used) ++ goto read_failure; ++ ++ for (b = 1; bytes < c_byte; b++) { ++ if (!(bh[b] = sb_getblk(s, ++cur_index))) ++ goto block_release; ++ bytes += msblk->devblksize; ++ } ++ ll_rw_block(READ, b - 1, bh + 1); ++ } ++ ++ if (compressed) { ++ int zlib_err = 0; ++ ++ /* ++ * uncompress block ++ */ ++ ++ mutex_lock(&msblk->read_data_mutex); ++ ++ msblk->stream.next_out = buffer; ++ msblk->stream.avail_out = srclength; ++ ++ for (bytes = 0; k < b; k++) { ++ avail_bytes = (c_byte - bytes) > (msblk->devblksize - offset) ? ++ msblk->devblksize - offset : ++ c_byte - bytes; ++ wait_on_buffer(bh[k]); ++ if (!buffer_uptodate(bh[k])) ++ goto release_mutex; ++ ++ msblk->stream.next_in = bh[k]->b_data + offset; ++ msblk->stream.avail_in = avail_bytes; ++ ++ if (k == 0) { ++ zlib_err = zlib_inflateInit(&msblk->stream); ++ if (zlib_err != Z_OK) { ++ ERROR("zlib_inflateInit returned unexpected result 0x%x, srclength %d\n", ++ zlib_err, srclength); ++ goto release_mutex; ++ } ++ ++ if (avail_bytes == 0) { ++ offset = 0; ++ brelse(bh[k]); ++ continue; ++ } ++ } ++ ++ zlib_err = zlib_inflate(&msblk->stream, Z_NO_FLUSH); ++ if (zlib_err != Z_OK && zlib_err != Z_STREAM_END) { ++ ERROR("zlib_inflate returned unexpected result 0x%x, srclength %d, avail_in %d, avail_out %d\n", ++ zlib_err, srclength, msblk->stream.avail_in, msblk->stream.avail_out); ++ goto release_mutex; ++ } ++ ++ bytes += avail_bytes; ++ offset = 0; ++ brelse(bh[k]); ++ } ++ ++ if (zlib_err != Z_STREAM_END) ++ goto release_mutex; ++ ++ zlib_err = zlib_inflateEnd(&msblk->stream); ++ if (zlib_err != Z_OK) { ++ ERROR("zlib_inflateEnd returned unexpected result 0x%x, srclength %d\n", ++ zlib_err, srclength); ++ goto release_mutex; ++ } ++ bytes = msblk->stream.total_out; ++ mutex_unlock(&msblk->read_data_mutex); ++ } else { ++ int i; ++ ++ for(i = 0; i < b; i++) { ++ wait_on_buffer(bh[i]); ++ if(!buffer_uptodate(bh[i])) ++ goto block_release; ++ } ++ ++ for (bytes = 0; k < b; k++) { ++ avail_bytes = (c_byte - bytes) > (msblk->devblksize - offset) ? ++ msblk->devblksize - offset : ++ c_byte - bytes; ++ memcpy(buffer + bytes, bh[k]->b_data + offset, avail_bytes); ++ bytes += avail_bytes; ++ offset = 0; ++ brelse(bh[k]); ++ } ++ } ++ ++ if (next_index) ++ *next_index = index + c_byte + (length ? 0 : ++ (SQUASHFS_CHECK_DATA(msblk->sblk.flags) ++ ? 3 : 2)); ++ return bytes; ++ ++release_mutex: ++ mutex_unlock(&msblk->read_data_mutex); ++ ++block_release: ++ for (; k < b; k++) ++ brelse(bh[k]); ++ ++read_failure: ++ ERROR("sb_bread failed reading block 0x%x\n", cur_index); ++ return 0; ++} ++ ++ ++SQSH_EXTERN int squashfs_get_cached_block(struct super_block *s, char *buffer, ++ long long block, unsigned int offset, ++ int length, long long *next_block, ++ unsigned int *next_offset) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ int n, i, bytes, return_length = length; ++ long long next_index; ++ ++ TRACE("Entered squashfs_get_cached_block [%llx:%x]\n", block, offset); ++ ++ while ( 1 ) { ++ for (i = 0; i < SQUASHFS_CACHED_BLKS; i++) ++ if (msblk->block_cache[i].block == block) ++ break; ++ ++ mutex_lock(&msblk->block_cache_mutex); ++ ++ if (i == SQUASHFS_CACHED_BLKS) { ++ /* read inode header block */ ++ for (i = msblk->next_cache, n = SQUASHFS_CACHED_BLKS; ++ n ; n --, i = (i + 1) % ++ SQUASHFS_CACHED_BLKS) ++ if (msblk->block_cache[i].block != ++ SQUASHFS_USED_BLK) ++ break; ++ ++ if (n == 0) { ++ wait_queue_t wait; ++ ++ init_waitqueue_entry(&wait, current); ++ add_wait_queue(&msblk->waitq, &wait); ++ set_current_state(TASK_UNINTERRUPTIBLE); ++ mutex_unlock(&msblk->block_cache_mutex); ++ schedule(); ++ set_current_state(TASK_RUNNING); ++ remove_wait_queue(&msblk->waitq, &wait); ++ continue; ++ } ++ msblk->next_cache = (i + 1) % SQUASHFS_CACHED_BLKS; ++ ++ if (msblk->block_cache[i].block == ++ SQUASHFS_INVALID_BLK) { ++ if (!(msblk->block_cache[i].data = ++ kmalloc(SQUASHFS_METADATA_SIZE, ++ GFP_KERNEL))) { ++ ERROR("Failed to allocate cache" ++ "block\n"); ++ mutex_unlock(&msblk->block_cache_mutex); ++ goto out; ++ } ++ } ++ ++ msblk->block_cache[i].block = SQUASHFS_USED_BLK; ++ mutex_unlock(&msblk->block_cache_mutex); ++ ++ msblk->block_cache[i].length = squashfs_read_data(s, ++ msblk->block_cache[i].data, block, 0, &next_index, SQUASHFS_METADATA_SIZE); ++ if (msblk->block_cache[i].length == 0) { ++ ERROR("Unable to read cache block [%llx:%x]\n", ++ block, offset); ++ mutex_lock(&msblk->block_cache_mutex); ++ msblk->block_cache[i].block = SQUASHFS_INVALID_BLK; ++ kfree(msblk->block_cache[i].data); ++ wake_up(&msblk->waitq); ++ mutex_unlock(&msblk->block_cache_mutex); ++ goto out; ++ } ++ ++ mutex_lock(&msblk->block_cache_mutex); ++ wake_up(&msblk->waitq); ++ msblk->block_cache[i].block = block; ++ msblk->block_cache[i].next_index = next_index; ++ TRACE("Read cache block [%llx:%x]\n", block, offset); ++ } ++ ++ if (msblk->block_cache[i].block != block) { ++ mutex_unlock(&msblk->block_cache_mutex); ++ continue; ++ } ++ ++ bytes = msblk->block_cache[i].length - offset; ++ ++ if (bytes < 1) { ++ mutex_unlock(&msblk->block_cache_mutex); ++ goto out; ++ } else if (bytes >= length) { ++ if (buffer) ++ memcpy(buffer, msblk->block_cache[i].data + ++ offset, length); ++ if (msblk->block_cache[i].length - offset == length) { ++ *next_block = msblk->block_cache[i].next_index; ++ *next_offset = 0; ++ } else { ++ *next_block = block; ++ *next_offset = offset + length; ++ } ++ mutex_unlock(&msblk->block_cache_mutex); ++ goto finish; ++ } else { ++ if (buffer) { ++ memcpy(buffer, msblk->block_cache[i].data + ++ offset, bytes); ++ buffer += bytes; ++ } ++ block = msblk->block_cache[i].next_index; ++ mutex_unlock(&msblk->block_cache_mutex); ++ length -= bytes; ++ offset = 0; ++ } ++ } ++ ++finish: ++ return return_length; ++out: ++ return 0; ++} ++ ++ ++static int get_fragment_location(struct super_block *s, unsigned int fragment, ++ long long *fragment_start_block, ++ unsigned int *fragment_size) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ long long start_block = ++ msblk->fragment_index[SQUASHFS_FRAGMENT_INDEX(fragment)]; ++ int offset = SQUASHFS_FRAGMENT_INDEX_OFFSET(fragment); ++ struct squashfs_fragment_entry fragment_entry; ++ ++ if (msblk->swap) { ++ struct squashfs_fragment_entry sfragment_entry; ++ ++ if (!squashfs_get_cached_block(s, (char *) &sfragment_entry, ++ start_block, offset, ++ sizeof(sfragment_entry), &start_block, ++ &offset)) ++ goto out; ++ SQUASHFS_SWAP_FRAGMENT_ENTRY(&fragment_entry, &sfragment_entry); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) &fragment_entry, ++ start_block, offset, ++ sizeof(fragment_entry), &start_block, ++ &offset)) ++ goto out; ++ ++ *fragment_start_block = fragment_entry.start_block; ++ *fragment_size = fragment_entry.size; ++ ++ return 1; ++ ++out: ++ return 0; ++} ++ ++ ++SQSH_EXTERN void release_cached_fragment(struct squashfs_sb_info *msblk, struct ++ squashfs_fragment_cache *fragment) ++{ ++ mutex_lock(&msblk->fragment_mutex); ++ fragment->locked --; ++ wake_up(&msblk->fragment_wait_queue); ++ mutex_unlock(&msblk->fragment_mutex); ++} ++ ++ ++SQSH_EXTERN struct squashfs_fragment_cache *get_cached_fragment(struct super_block ++ *s, long long start_block, ++ int length) ++{ ++ int i, n; ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ ++ while ( 1 ) { ++ mutex_lock(&msblk->fragment_mutex); ++ ++ for (i = 0; i < SQUASHFS_CACHED_FRAGMENTS && ++ msblk->fragment[i].block != start_block; i++); ++ ++ if (i == SQUASHFS_CACHED_FRAGMENTS) { ++ for (i = msblk->next_fragment, n = ++ SQUASHFS_CACHED_FRAGMENTS; n && ++ msblk->fragment[i].locked; n--, i = (i + 1) % ++ SQUASHFS_CACHED_FRAGMENTS); ++ ++ if (n == 0) { ++ wait_queue_t wait; ++ ++ init_waitqueue_entry(&wait, current); ++ add_wait_queue(&msblk->fragment_wait_queue, ++ &wait); ++ set_current_state(TASK_UNINTERRUPTIBLE); ++ mutex_unlock(&msblk->fragment_mutex); ++ schedule(); ++ set_current_state(TASK_RUNNING); ++ remove_wait_queue(&msblk->fragment_wait_queue, ++ &wait); ++ continue; ++ } ++ msblk->next_fragment = (msblk->next_fragment + 1) % ++ SQUASHFS_CACHED_FRAGMENTS; ++ ++ if (msblk->fragment[i].data == NULL) ++ if (!(msblk->fragment[i].data = SQUASHFS_ALLOC ++ (SQUASHFS_FILE_MAX_SIZE))) { ++ ERROR("Failed to allocate fragment " ++ "cache block\n"); ++ mutex_unlock(&msblk->fragment_mutex); ++ goto out; ++ } ++ ++ msblk->fragment[i].block = SQUASHFS_INVALID_BLK; ++ msblk->fragment[i].locked = 1; ++ mutex_unlock(&msblk->fragment_mutex); ++ ++ if (!(msblk->fragment[i].length = squashfs_read_data(s, ++ msblk->fragment[i].data, ++ start_block, length, NULL, sblk->block_size))) { ++ ERROR("Unable to read fragment cache block " ++ "[%llx]\n", start_block); ++ msblk->fragment[i].locked = 0; ++ smp_mb(); ++ goto out; ++ } ++ ++ mutex_lock(&msblk->fragment_mutex); ++ msblk->fragment[i].block = start_block; ++ TRACE("New fragment %d, start block %lld, locked %d\n", ++ i, msblk->fragment[i].block, ++ msblk->fragment[i].locked); ++ mutex_unlock(&msblk->fragment_mutex); ++ break; ++ } ++ ++ msblk->fragment[i].locked++; ++ mutex_unlock(&msblk->fragment_mutex); ++ TRACE("Got fragment %d, start block %lld, locked %d\n", i, ++ msblk->fragment[i].block, ++ msblk->fragment[i].locked); ++ break; ++ } ++ ++ return &msblk->fragment[i]; ++ ++out: ++ return NULL; ++} ++ ++ ++static void squashfs_new_inode(struct squashfs_sb_info *msblk, struct inode *i, ++ struct squashfs_base_inode_header *inodeb) ++{ ++ i->i_ino = inodeb->inode_number; ++ i->i_mtime.tv_sec = inodeb->mtime; ++ i->i_atime.tv_sec = inodeb->mtime; ++ i->i_ctime.tv_sec = inodeb->mtime; ++ i->i_uid = msblk->uid[inodeb->uid]; ++ i->i_mode = inodeb->mode; ++ i->i_size = 0; ++ if (inodeb->guid == SQUASHFS_GUIDS) ++ i->i_gid = i->i_uid; ++ else ++ i->i_gid = msblk->guid[inodeb->guid]; ++} ++ ++ ++static squashfs_inode_t squashfs_inode_lookup(struct super_block *s, int ino) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ long long start = msblk->inode_lookup_table[SQUASHFS_LOOKUP_BLOCK(ino - 1)]; ++ int offset = SQUASHFS_LOOKUP_BLOCK_OFFSET(ino - 1); ++ squashfs_inode_t inode; ++ ++ TRACE("Entered squashfs_inode_lookup, inode_number = %d\n", ino); ++ ++ if (msblk->swap) { ++ squashfs_inode_t sinode; ++ ++ if (!squashfs_get_cached_block(s, (char *) &sinode, start, offset, ++ sizeof(sinode), &start, &offset)) ++ goto out; ++ SQUASHFS_SWAP_INODE_T((&inode), &sinode); ++ } else if (!squashfs_get_cached_block(s, (char *) &inode, start, offset, ++ sizeof(inode), &start, &offset)) ++ goto out; ++ ++ TRACE("squashfs_inode_lookup, inode = 0x%llx\n", inode); ++ ++ return inode; ++ ++out: ++ return SQUASHFS_INVALID_BLK; ++} ++ ++ ++static void vfs_read_inode(struct inode *i) ++{ ++ struct squashfs_sb_info *msblk = i->i_sb->s_fs_info; ++ squashfs_inode_t inode = squashfs_inode_lookup(i->i_sb, i->i_ino); ++ ++ TRACE("Entered vfs_read_inode\n"); ++ ++ if(inode != SQUASHFS_INVALID_BLK) ++ (msblk->read_inode)(i, inode); ++} ++ ++ ++static struct dentry *squashfs_get_parent(struct dentry *child) ++{ ++ struct inode *i = child->d_inode; ++ struct inode *parent = iget(i->i_sb, SQUASHFS_I(i)->u.s2.parent_inode); ++ struct dentry *rv; ++ ++ TRACE("Entered squashfs_get_parent\n"); ++ ++ if(parent == NULL) { ++ rv = ERR_PTR(-EACCES); ++ goto out; ++ } ++ ++ rv = d_alloc_anon(parent); ++ if(rv == NULL) ++ rv = ERR_PTR(-ENOMEM); ++ ++out: ++ return rv; ++} ++ ++ ++SQSH_EXTERN struct inode *squashfs_iget(struct super_block *s, squashfs_inode_t inode, unsigned int inode_number) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct inode *i = iget_locked(s, inode_number); ++ ++ TRACE("Entered squashfs_iget\n"); ++ ++ if(i && (i->i_state & I_NEW)) { ++ (msblk->read_inode)(i, inode); ++ unlock_new_inode(i); ++ } ++ ++ return i; ++} ++ ++ ++static int squashfs_read_inode(struct inode *i, squashfs_inode_t inode) ++{ ++ struct super_block *s = i->i_sb; ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ long long block = SQUASHFS_INODE_BLK(inode) + ++ sblk->inode_table_start; ++ unsigned int offset = SQUASHFS_INODE_OFFSET(inode); ++ long long next_block; ++ unsigned int next_offset; ++ union squashfs_inode_header id, sid; ++ struct squashfs_base_inode_header *inodeb = &id.base, ++ *sinodeb = &sid.base; ++ ++ TRACE("Entered squashfs_read_inode\n"); ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) sinodeb, block, ++ offset, sizeof(*sinodeb), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_BASE_INODE_HEADER(inodeb, sinodeb, ++ sizeof(*sinodeb)); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) inodeb, block, ++ offset, sizeof(*inodeb), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ squashfs_new_inode(msblk, i, inodeb); ++ ++ switch(inodeb->inode_type) { ++ case SQUASHFS_FILE_TYPE: { ++ unsigned int frag_size; ++ long long frag_blk; ++ struct squashfs_reg_inode_header *inodep = &id.reg; ++ struct squashfs_reg_inode_header *sinodep = &sid.reg; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_REG_INODE_HEADER(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ frag_blk = SQUASHFS_INVALID_BLK; ++ if (inodep->fragment != SQUASHFS_INVALID_FRAG && ++ !get_fragment_location(s, ++ inodep->fragment, &frag_blk, &frag_size)) ++ goto failed_read; ++ ++ i->i_nlink = 1; ++ i->i_size = inodep->file_size; ++ i->i_fop = &generic_ro_fops; ++ i->i_mode |= S_IFREG; ++ i->i_blocks = ((i->i_size - 1) >> 9) + 1; ++ SQUASHFS_I(i)->u.s1.fragment_start_block = frag_blk; ++ SQUASHFS_I(i)->u.s1.fragment_size = frag_size; ++ SQUASHFS_I(i)->u.s1.fragment_offset = inodep->offset; ++ SQUASHFS_I(i)->start_block = inodep->start_block; ++ SQUASHFS_I(i)->u.s1.block_list_start = next_block; ++ SQUASHFS_I(i)->offset = next_offset; ++ if (sblk->block_size > 4096) ++ i->i_data.a_ops = &squashfs_aops; ++ else ++ i->i_data.a_ops = &squashfs_aops_4K; ++ ++ TRACE("File inode %x:%x, start_block %llx, " ++ "block_list_start %llx, offset %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ inodep->start_block, next_block, ++ next_offset); ++ break; ++ } ++ case SQUASHFS_LREG_TYPE: { ++ unsigned int frag_size; ++ long long frag_blk; ++ struct squashfs_lreg_inode_header *inodep = &id.lreg; ++ struct squashfs_lreg_inode_header *sinodep = &sid.lreg; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_LREG_INODE_HEADER(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ frag_blk = SQUASHFS_INVALID_BLK; ++ if (inodep->fragment != SQUASHFS_INVALID_FRAG && ++ !get_fragment_location(s, ++ inodep->fragment, &frag_blk, &frag_size)) ++ goto failed_read; ++ ++ i->i_nlink = inodep->nlink; ++ i->i_size = inodep->file_size; ++ i->i_fop = &generic_ro_fops; ++ i->i_mode |= S_IFREG; ++ i->i_blocks = ((i->i_size - 1) >> 9) + 1; ++ SQUASHFS_I(i)->u.s1.fragment_start_block = frag_blk; ++ SQUASHFS_I(i)->u.s1.fragment_size = frag_size; ++ SQUASHFS_I(i)->u.s1.fragment_offset = inodep->offset; ++ SQUASHFS_I(i)->start_block = inodep->start_block; ++ SQUASHFS_I(i)->u.s1.block_list_start = next_block; ++ SQUASHFS_I(i)->offset = next_offset; ++ if (sblk->block_size > 4096) ++ i->i_data.a_ops = &squashfs_aops; ++ else ++ i->i_data.a_ops = &squashfs_aops_4K; ++ ++ TRACE("File inode %x:%x, start_block %llx, " ++ "block_list_start %llx, offset %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ inodep->start_block, next_block, ++ next_offset); ++ break; ++ } ++ case SQUASHFS_DIR_TYPE: { ++ struct squashfs_dir_inode_header *inodep = &id.dir; ++ struct squashfs_dir_inode_header *sinodep = &sid.dir; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_DIR_INODE_HEADER(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_nlink = inodep->nlink; ++ i->i_size = inodep->file_size; ++ i->i_op = &squashfs_dir_inode_ops; ++ i->i_fop = &squashfs_dir_ops; ++ i->i_mode |= S_IFDIR; ++ SQUASHFS_I(i)->start_block = inodep->start_block; ++ SQUASHFS_I(i)->offset = inodep->offset; ++ SQUASHFS_I(i)->u.s2.directory_index_count = 0; ++ SQUASHFS_I(i)->u.s2.parent_inode = inodep->parent_inode; ++ ++ TRACE("Directory inode %x:%x, start_block %x, offset " ++ "%x\n", SQUASHFS_INODE_BLK(inode), ++ offset, inodep->start_block, ++ inodep->offset); ++ break; ++ } ++ case SQUASHFS_LDIR_TYPE: { ++ struct squashfs_ldir_inode_header *inodep = &id.ldir; ++ struct squashfs_ldir_inode_header *sinodep = &sid.ldir; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_LDIR_INODE_HEADER(inodep, ++ sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_nlink = inodep->nlink; ++ i->i_size = inodep->file_size; ++ i->i_op = &squashfs_dir_inode_ops; ++ i->i_fop = &squashfs_dir_ops; ++ i->i_mode |= S_IFDIR; ++ SQUASHFS_I(i)->start_block = inodep->start_block; ++ SQUASHFS_I(i)->offset = inodep->offset; ++ SQUASHFS_I(i)->u.s2.directory_index_start = next_block; ++ SQUASHFS_I(i)->u.s2.directory_index_offset = ++ next_offset; ++ SQUASHFS_I(i)->u.s2.directory_index_count = ++ inodep->i_count; ++ SQUASHFS_I(i)->u.s2.parent_inode = inodep->parent_inode; ++ ++ TRACE("Long directory inode %x:%x, start_block %x, " ++ "offset %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ inodep->start_block, inodep->offset); ++ break; ++ } ++ case SQUASHFS_SYMLINK_TYPE: { ++ struct squashfs_symlink_inode_header *inodep = ++ &id.symlink; ++ struct squashfs_symlink_inode_header *sinodep = ++ &sid.symlink; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_SYMLINK_INODE_HEADER(inodep, ++ sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_nlink = inodep->nlink; ++ i->i_size = inodep->symlink_size; ++ i->i_op = &page_symlink_inode_operations; ++ i->i_data.a_ops = &squashfs_symlink_aops; ++ i->i_mode |= S_IFLNK; ++ SQUASHFS_I(i)->start_block = next_block; ++ SQUASHFS_I(i)->offset = next_offset; ++ ++ TRACE("Symbolic link inode %x:%x, start_block %llx, " ++ "offset %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ next_block, next_offset); ++ break; ++ } ++ case SQUASHFS_BLKDEV_TYPE: ++ case SQUASHFS_CHRDEV_TYPE: { ++ struct squashfs_dev_inode_header *inodep = &id.dev; ++ struct squashfs_dev_inode_header *sinodep = &sid.dev; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_DEV_INODE_HEADER(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_nlink = inodep->nlink; ++ i->i_mode |= (inodeb->inode_type == ++ SQUASHFS_CHRDEV_TYPE) ? S_IFCHR : ++ S_IFBLK; ++ init_special_inode(i, i->i_mode, ++ old_decode_dev(inodep->rdev)); ++ ++ TRACE("Device inode %x:%x, rdev %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ inodep->rdev); ++ break; ++ } ++ case SQUASHFS_FIFO_TYPE: ++ case SQUASHFS_SOCKET_TYPE: { ++ struct squashfs_ipc_inode_header *inodep = &id.ipc; ++ struct squashfs_ipc_inode_header *sinodep = &sid.ipc; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_IPC_INODE_HEADER(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_nlink = inodep->nlink; ++ i->i_mode |= (inodeb->inode_type == SQUASHFS_FIFO_TYPE) ++ ? S_IFIFO : S_IFSOCK; ++ init_special_inode(i, i->i_mode, 0); ++ break; ++ } ++ default: ++ ERROR("Unknown inode type %d in squashfs_iget!\n", ++ inodeb->inode_type); ++ goto failed_read1; ++ } ++ ++ return 1; ++ ++failed_read: ++ ERROR("Unable to read inode [%llx:%x]\n", block, offset); ++ ++failed_read1: ++ make_bad_inode(i); ++ return 0; ++} ++ ++ ++static int read_inode_lookup_table(struct super_block *s) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ unsigned int length = SQUASHFS_LOOKUP_BLOCK_BYTES(sblk->inodes); ++ ++ TRACE("In read_inode_lookup_table, length %d\n", length); ++ ++ /* Allocate inode lookup table */ ++ if (!(msblk->inode_lookup_table = kmalloc(length, GFP_KERNEL))) { ++ ERROR("Failed to allocate inode lookup table\n"); ++ return 0; ++ } ++ ++ if (!squashfs_read_data(s, (char *) msblk->inode_lookup_table, ++ sblk->lookup_table_start, length | ++ SQUASHFS_COMPRESSED_BIT_BLOCK, NULL, length)) { ++ ERROR("unable to read inode lookup table\n"); ++ return 0; ++ } ++ ++ if (msblk->swap) { ++ int i; ++ long long block; ++ ++ for (i = 0; i < SQUASHFS_LOOKUP_BLOCKS(sblk->inodes); i++) { ++ SQUASHFS_SWAP_LOOKUP_BLOCKS((&block), ++ &msblk->inode_lookup_table[i], 1); ++ msblk->inode_lookup_table[i] = block; ++ } ++ } ++ ++ return 1; ++} ++ ++ ++static int read_fragment_index_table(struct super_block *s) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ unsigned int length = SQUASHFS_FRAGMENT_INDEX_BYTES(sblk->fragments); ++ ++ if(length == 0) ++ return 1; ++ ++ /* Allocate fragment index table */ ++ if (!(msblk->fragment_index = kmalloc(length, GFP_KERNEL))) { ++ ERROR("Failed to allocate fragment index table\n"); ++ return 0; ++ } ++ ++ if (!squashfs_read_data(s, (char *) msblk->fragment_index, ++ sblk->fragment_table_start, length | ++ SQUASHFS_COMPRESSED_BIT_BLOCK, NULL, length)) { ++ ERROR("unable to read fragment index table\n"); ++ return 0; ++ } ++ ++ if (msblk->swap) { ++ int i; ++ long long fragment; ++ ++ for (i = 0; i < SQUASHFS_FRAGMENT_INDEXES(sblk->fragments); i++) { ++ SQUASHFS_SWAP_FRAGMENT_INDEXES((&fragment), ++ &msblk->fragment_index[i], 1); ++ msblk->fragment_index[i] = fragment; ++ } ++ } ++ ++ return 1; ++} ++ ++ ++static int supported_squashfs_filesystem(struct squashfs_sb_info *msblk, int silent) ++{ ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ ++ msblk->read_inode = squashfs_read_inode; ++ msblk->read_blocklist = read_blocklist; ++ msblk->read_fragment_index_table = read_fragment_index_table; ++ ++ if (sblk->s_major == 1) { ++ if (!squashfs_1_0_supported(msblk)) { ++ SERROR("Major/Minor mismatch, Squashfs 1.0 filesystems " ++ "are unsupported\n"); ++ SERROR("Please recompile with " ++ "Squashfs 1.0 support enabled\n"); ++ return 0; ++ } ++ } else if (sblk->s_major == 2) { ++ if (!squashfs_2_0_supported(msblk)) { ++ SERROR("Major/Minor mismatch, Squashfs 2.0 filesystems " ++ "are unsupported\n"); ++ SERROR("Please recompile with " ++ "Squashfs 2.0 support enabled\n"); ++ return 0; ++ } ++ } else if(sblk->s_major != SQUASHFS_MAJOR || sblk->s_minor > ++ SQUASHFS_MINOR) { ++ SERROR("Major/Minor mismatch, trying to mount newer %d.%d " ++ "filesystem\n", sblk->s_major, sblk->s_minor); ++ SERROR("Please update your kernel\n"); ++ return 0; ++ } ++ ++ return 1; ++} ++ ++ ++static int squashfs_fill_super(struct super_block *s, void *data, int silent) ++{ ++ struct squashfs_sb_info *msblk; ++ struct squashfs_super_block *sblk; ++ int i; ++ char b[BDEVNAME_SIZE]; ++ struct inode *root; ++ ++ TRACE("Entered squashfs_read_superblock\n"); ++ ++ if (!(s->s_fs_info = kmalloc(sizeof(struct squashfs_sb_info), ++ GFP_KERNEL))) { ++ ERROR("Failed to allocate superblock\n"); ++ goto failure; ++ } ++ memset(s->s_fs_info, 0, sizeof(struct squashfs_sb_info)); ++ msblk = s->s_fs_info; ++ if (!(msblk->stream.workspace = vmalloc(zlib_inflate_workspacesize()))) { ++ ERROR("Failed to allocate zlib workspace\n"); ++ goto failure; ++ } ++ sblk = &msblk->sblk; ++ ++ msblk->devblksize = sb_min_blocksize(s, BLOCK_SIZE); ++ msblk->devblksize_log2 = ffz(~msblk->devblksize); ++ ++ mutex_init(&msblk->read_data_mutex); ++ mutex_init(&msblk->read_page_mutex); ++ mutex_init(&msblk->block_cache_mutex); ++ mutex_init(&msblk->fragment_mutex); ++ mutex_init(&msblk->meta_index_mutex); ++ ++ init_waitqueue_head(&msblk->waitq); ++ init_waitqueue_head(&msblk->fragment_wait_queue); ++ ++ sblk->bytes_used = sizeof(struct squashfs_super_block); ++ if (!squashfs_read_data(s, (char *) sblk, SQUASHFS_START, ++ sizeof(struct squashfs_super_block) | ++ SQUASHFS_COMPRESSED_BIT_BLOCK, NULL, sizeof(struct squashfs_super_block))) { ++ SERROR("unable to read superblock\n"); ++ goto failed_mount; ++ } ++ ++ /* Check it is a SQUASHFS superblock */ ++ msblk->swap = 0; ++ if ((s->s_magic = sblk->s_magic) != SQUASHFS_MAGIC) { ++ if (sblk->s_magic == SQUASHFS_MAGIC_SWAP) { ++ struct squashfs_super_block ssblk; ++ ++ WARNING("Mounting a different endian SQUASHFS " ++ "filesystem on %s\n", bdevname(s->s_bdev, b)); ++ ++ SQUASHFS_SWAP_SUPER_BLOCK(&ssblk, sblk); ++ memcpy(sblk, &ssblk, sizeof(struct squashfs_super_block)); ++ msblk->swap = 1; ++ } else { ++ SERROR("Can't find a SQUASHFS superblock on %s\n", ++ bdevname(s->s_bdev, b)); ++ goto failed_mount; ++ } ++ } ++ ++ /* Check the MAJOR & MINOR versions */ ++ if(!supported_squashfs_filesystem(msblk, silent)) ++ goto failed_mount; ++ ++ /* Check the filesystem does not extend beyond the end of the ++ block device */ ++ if(sblk->bytes_used < 0 || sblk->bytes_used > i_size_read(s->s_bdev->bd_inode)) ++ goto failed_mount; ++ ++ /* Check the root inode for sanity */ ++ if (SQUASHFS_INODE_OFFSET(sblk->root_inode) > SQUASHFS_METADATA_SIZE) ++ goto failed_mount; ++ ++ TRACE("Found valid superblock on %s\n", bdevname(s->s_bdev, b)); ++ TRACE("Inodes are %scompressed\n", ++ SQUASHFS_UNCOMPRESSED_INODES ++ (sblk->flags) ? "un" : ""); ++ TRACE("Data is %scompressed\n", ++ SQUASHFS_UNCOMPRESSED_DATA(sblk->flags) ++ ? "un" : ""); ++ TRACE("Check data is %s present in the filesystem\n", ++ SQUASHFS_CHECK_DATA(sblk->flags) ? ++ "" : "not"); ++ TRACE("Filesystem size %lld bytes\n", sblk->bytes_used); ++ TRACE("Block size %d\n", sblk->block_size); ++ TRACE("Number of inodes %d\n", sblk->inodes); ++ if (sblk->s_major > 1) ++ TRACE("Number of fragments %d\n", sblk->fragments); ++ TRACE("Number of uids %d\n", sblk->no_uids); ++ TRACE("Number of gids %d\n", sblk->no_guids); ++ TRACE("sblk->inode_table_start %llx\n", sblk->inode_table_start); ++ TRACE("sblk->directory_table_start %llx\n", sblk->directory_table_start); ++ if (sblk->s_major > 1) ++ TRACE("sblk->fragment_table_start %llx\n", ++ sblk->fragment_table_start); ++ TRACE("sblk->uid_start %llx\n", sblk->uid_start); ++ ++ s->s_flags |= MS_RDONLY; ++ s->s_op = &squashfs_super_ops; ++ ++ /* Init inode_table block pointer array */ ++ if (!(msblk->block_cache = kmalloc(sizeof(struct squashfs_cache) * ++ SQUASHFS_CACHED_BLKS, GFP_KERNEL))) { ++ ERROR("Failed to allocate block cache\n"); ++ goto failed_mount; ++ } ++ ++ for (i = 0; i < SQUASHFS_CACHED_BLKS; i++) ++ msblk->block_cache[i].block = SQUASHFS_INVALID_BLK; ++ ++ msblk->next_cache = 0; ++ ++ /* Allocate read_page block */ ++ if (!(msblk->read_page = kmalloc(sblk->block_size, GFP_KERNEL))) { ++ ERROR("Failed to allocate read_page block\n"); ++ goto failed_mount; ++ } ++ ++ /* Allocate uid and gid tables */ ++ if (!(msblk->uid = kmalloc((sblk->no_uids + sblk->no_guids) * ++ sizeof(unsigned int), GFP_KERNEL))) { ++ ERROR("Failed to allocate uid/gid table\n"); ++ goto failed_mount; ++ } ++ msblk->guid = msblk->uid + sblk->no_uids; ++ ++ if (msblk->swap) { ++ unsigned int suid[sblk->no_uids + sblk->no_guids]; ++ ++ if (!squashfs_read_data(s, (char *) &suid, sblk->uid_start, ++ ((sblk->no_uids + sblk->no_guids) * ++ sizeof(unsigned int)) | ++ SQUASHFS_COMPRESSED_BIT_BLOCK, NULL, (sblk->no_uids + sblk->no_guids) * sizeof(unsigned int))) { ++ ERROR("unable to read uid/gid table\n"); ++ goto failed_mount; ++ } ++ ++ SQUASHFS_SWAP_DATA(msblk->uid, suid, (sblk->no_uids + ++ sblk->no_guids), (sizeof(unsigned int) * 8)); ++ } else ++ if (!squashfs_read_data(s, (char *) msblk->uid, sblk->uid_start, ++ ((sblk->no_uids + sblk->no_guids) * ++ sizeof(unsigned int)) | ++ SQUASHFS_COMPRESSED_BIT_BLOCK, NULL, (sblk->no_uids + sblk->no_guids) * sizeof(unsigned int))) { ++ ERROR("unable to read uid/gid table\n"); ++ goto failed_mount; ++ } ++ ++ ++ if (sblk->s_major == 1 && squashfs_1_0_supported(msblk)) ++ goto allocate_root; ++ ++ if (!(msblk->fragment = kmalloc(sizeof(struct squashfs_fragment_cache) * ++ SQUASHFS_CACHED_FRAGMENTS, GFP_KERNEL))) { ++ ERROR("Failed to allocate fragment block cache\n"); ++ goto failed_mount; ++ } ++ ++ for (i = 0; i < SQUASHFS_CACHED_FRAGMENTS; i++) { ++ msblk->fragment[i].locked = 0; ++ msblk->fragment[i].block = SQUASHFS_INVALID_BLK; ++ msblk->fragment[i].data = NULL; ++ } ++ ++ msblk->next_fragment = 0; ++ ++ /* Allocate and read fragment index table */ ++ if (msblk->read_fragment_index_table(s) == 0) ++ goto failed_mount; ++ ++ if(sblk->s_major < 3 || sblk->lookup_table_start == SQUASHFS_INVALID_BLK) ++ goto allocate_root; ++ ++ /* Allocate and read inode lookup table */ ++ if (read_inode_lookup_table(s) == 0) ++ goto failed_mount; ++ ++ s->s_op = &squashfs_export_super_ops; ++ s->s_export_op = &squashfs_export_ops; ++ ++allocate_root: ++ root = new_inode(s); ++ if ((msblk->read_inode)(root, sblk->root_inode) == 0) ++ goto failed_mount; ++ insert_inode_hash(root); ++ ++ if ((s->s_root = d_alloc_root(root)) == NULL) { ++ ERROR("Root inode create failed\n"); ++ iput(root); ++ goto failed_mount; ++ } ++ ++ TRACE("Leaving squashfs_read_super\n"); ++ return 0; ++ ++failed_mount: ++ kfree(msblk->inode_lookup_table); ++ kfree(msblk->fragment_index); ++ kfree(msblk->fragment); ++ kfree(msblk->uid); ++ kfree(msblk->read_page); ++ kfree(msblk->block_cache); ++ kfree(msblk->fragment_index_2); ++ vfree(msblk->stream.workspace); ++ kfree(s->s_fs_info); ++ s->s_fs_info = NULL; ++ return -EINVAL; ++ ++failure: ++ return -ENOMEM; ++} ++ ++ ++static int squashfs_statfs(struct dentry *dentry, struct kstatfs *buf) ++{ ++ struct squashfs_sb_info *msblk = dentry->d_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ ++ TRACE("Entered squashfs_statfs\n"); ++ ++ buf->f_type = SQUASHFS_MAGIC; ++ buf->f_bsize = sblk->block_size; ++ buf->f_blocks = ((sblk->bytes_used - 1) >> sblk->block_log) + 1; ++ buf->f_bfree = buf->f_bavail = 0; ++ buf->f_files = sblk->inodes; ++ buf->f_ffree = 0; ++ buf->f_namelen = SQUASHFS_NAME_LEN; ++ ++ return 0; ++} ++ ++ ++static int squashfs_symlink_readpage(struct file *file, struct page *page) ++{ ++ struct inode *inode = page->mapping->host; ++ int index = page->index << PAGE_CACHE_SHIFT, length, bytes; ++ long long block = SQUASHFS_I(inode)->start_block; ++ int offset = SQUASHFS_I(inode)->offset; ++ void *pageaddr = kmap(page); ++ ++ TRACE("Entered squashfs_symlink_readpage, page index %ld, start block " ++ "%llx, offset %x\n", page->index, ++ SQUASHFS_I(inode)->start_block, ++ SQUASHFS_I(inode)->offset); ++ ++ for (length = 0; length < index; length += bytes) { ++ if (!(bytes = squashfs_get_cached_block(inode->i_sb, NULL, ++ block, offset, PAGE_CACHE_SIZE, &block, ++ &offset))) { ++ ERROR("Unable to read symbolic link [%llx:%x]\n", block, ++ offset); ++ goto skip_read; ++ } ++ } ++ ++ if (length != index) { ++ ERROR("(squashfs_symlink_readpage) length != index\n"); ++ bytes = 0; ++ goto skip_read; ++ } ++ ++ bytes = (i_size_read(inode) - length) > PAGE_CACHE_SIZE ? PAGE_CACHE_SIZE : ++ i_size_read(inode) - length; ++ ++ if (!(bytes = squashfs_get_cached_block(inode->i_sb, pageaddr, block, ++ offset, bytes, &block, &offset))) ++ ERROR("Unable to read symbolic link [%llx:%x]\n", block, offset); ++ ++skip_read: ++ memset(pageaddr + bytes, 0, PAGE_CACHE_SIZE - bytes); ++ kunmap(page); ++ flush_dcache_page(page); ++ SetPageUptodate(page); ++ unlock_page(page); ++ ++ return 0; ++} ++ ++ ++struct meta_index *locate_meta_index(struct inode *inode, int index, int offset) ++{ ++ struct meta_index *meta = NULL; ++ struct squashfs_sb_info *msblk = inode->i_sb->s_fs_info; ++ int i; ++ ++ mutex_lock(&msblk->meta_index_mutex); ++ ++ TRACE("locate_meta_index: index %d, offset %d\n", index, offset); ++ ++ if(msblk->meta_index == NULL) ++ goto not_allocated; ++ ++ for (i = 0; i < SQUASHFS_META_NUMBER; i ++) ++ if (msblk->meta_index[i].inode_number == inode->i_ino && ++ msblk->meta_index[i].offset >= offset && ++ msblk->meta_index[i].offset <= index && ++ msblk->meta_index[i].locked == 0) { ++ TRACE("locate_meta_index: entry %d, offset %d\n", i, ++ msblk->meta_index[i].offset); ++ meta = &msblk->meta_index[i]; ++ offset = meta->offset; ++ } ++ ++ if (meta) ++ meta->locked = 1; ++ ++not_allocated: ++ mutex_unlock(&msblk->meta_index_mutex); ++ ++ return meta; ++} ++ ++ ++struct meta_index *empty_meta_index(struct inode *inode, int offset, int skip) ++{ ++ struct squashfs_sb_info *msblk = inode->i_sb->s_fs_info; ++ struct meta_index *meta = NULL; ++ int i; ++ ++ mutex_lock(&msblk->meta_index_mutex); ++ ++ TRACE("empty_meta_index: offset %d, skip %d\n", offset, skip); ++ ++ if(msblk->meta_index == NULL) { ++ if (!(msblk->meta_index = kmalloc(sizeof(struct meta_index) * ++ SQUASHFS_META_NUMBER, GFP_KERNEL))) { ++ ERROR("Failed to allocate meta_index\n"); ++ goto failed; ++ } ++ for(i = 0; i < SQUASHFS_META_NUMBER; i++) { ++ msblk->meta_index[i].inode_number = 0; ++ msblk->meta_index[i].locked = 0; ++ } ++ msblk->next_meta_index = 0; ++ } ++ ++ for(i = SQUASHFS_META_NUMBER; i && ++ msblk->meta_index[msblk->next_meta_index].locked; i --) ++ msblk->next_meta_index = (msblk->next_meta_index + 1) % ++ SQUASHFS_META_NUMBER; ++ ++ if(i == 0) { ++ TRACE("empty_meta_index: failed!\n"); ++ goto failed; ++ } ++ ++ TRACE("empty_meta_index: returned meta entry %d, %p\n", ++ msblk->next_meta_index, ++ &msblk->meta_index[msblk->next_meta_index]); ++ ++ meta = &msblk->meta_index[msblk->next_meta_index]; ++ msblk->next_meta_index = (msblk->next_meta_index + 1) % ++ SQUASHFS_META_NUMBER; ++ ++ meta->inode_number = inode->i_ino; ++ meta->offset = offset; ++ meta->skip = skip; ++ meta->entries = 0; ++ meta->locked = 1; ++ ++failed: ++ mutex_unlock(&msblk->meta_index_mutex); ++ return meta; ++} ++ ++ ++void release_meta_index(struct inode *inode, struct meta_index *meta) ++{ ++ meta->locked = 0; ++ smp_mb(); ++} ++ ++ ++static int read_block_index(struct super_block *s, int blocks, char *block_list, ++ long long *start_block, int *offset) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ unsigned int *block_listp; ++ int block = 0; ++ ++ if (msblk->swap) { ++ char sblock_list[blocks << 2]; ++ ++ if (!squashfs_get_cached_block(s, sblock_list, *start_block, ++ *offset, blocks << 2, start_block, offset)) { ++ ERROR("Unable to read block list [%llx:%x]\n", ++ *start_block, *offset); ++ goto failure; ++ } ++ SQUASHFS_SWAP_INTS(((unsigned int *)block_list), ++ ((unsigned int *)sblock_list), blocks); ++ } else ++ if (!squashfs_get_cached_block(s, block_list, *start_block, ++ *offset, blocks << 2, start_block, offset)) { ++ ERROR("Unable to read block list [%llx:%x]\n", ++ *start_block, *offset); ++ goto failure; ++ } ++ ++ for (block_listp = (unsigned int *) block_list; blocks; ++ block_listp++, blocks --) ++ block += SQUASHFS_COMPRESSED_SIZE_BLOCK(*block_listp); ++ ++ return block; ++ ++failure: ++ return -1; ++} ++ ++ ++#define SIZE 256 ++ ++static inline int calculate_skip(int blocks) { ++ int skip = (blocks - 1) / ((SQUASHFS_SLOTS * SQUASHFS_META_ENTRIES + 1) * SQUASHFS_META_INDEXES); ++ return skip >= 7 ? 7 : skip + 1; ++} ++ ++ ++static int get_meta_index(struct inode *inode, int index, ++ long long *index_block, int *index_offset, ++ long long *data_block, char *block_list) ++{ ++ struct squashfs_sb_info *msblk = inode->i_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ int skip = calculate_skip(i_size_read(inode) >> sblk->block_log); ++ int offset = 0; ++ struct meta_index *meta; ++ struct meta_entry *meta_entry; ++ long long cur_index_block = SQUASHFS_I(inode)->u.s1.block_list_start; ++ int cur_offset = SQUASHFS_I(inode)->offset; ++ long long cur_data_block = SQUASHFS_I(inode)->start_block; ++ int i; ++ ++ index /= SQUASHFS_META_INDEXES * skip; ++ ++ while ( offset < index ) { ++ meta = locate_meta_index(inode, index, offset + 1); ++ ++ if (meta == NULL) { ++ if ((meta = empty_meta_index(inode, offset + 1, ++ skip)) == NULL) ++ goto all_done; ++ } else { ++ if(meta->entries == 0) ++ goto failed; ++ offset = index < meta->offset + meta->entries ? index : ++ meta->offset + meta->entries - 1; ++ meta_entry = &meta->meta_entry[offset - meta->offset]; ++ cur_index_block = meta_entry->index_block + sblk->inode_table_start; ++ cur_offset = meta_entry->offset; ++ cur_data_block = meta_entry->data_block; ++ TRACE("get_meta_index: offset %d, meta->offset %d, " ++ "meta->entries %d\n", offset, meta->offset, ++ meta->entries); ++ TRACE("get_meta_index: index_block 0x%llx, offset 0x%x" ++ " data_block 0x%llx\n", cur_index_block, ++ cur_offset, cur_data_block); ++ } ++ ++ for (i = meta->offset + meta->entries; i <= index && ++ i < meta->offset + SQUASHFS_META_ENTRIES; i++) { ++ int blocks = skip * SQUASHFS_META_INDEXES; ++ ++ while (blocks) { ++ int block = blocks > (SIZE >> 2) ? (SIZE >> 2) : ++ blocks; ++ int res = read_block_index(inode->i_sb, block, ++ block_list, &cur_index_block, ++ &cur_offset); ++ ++ if (res == -1) ++ goto failed; ++ ++ cur_data_block += res; ++ blocks -= block; ++ } ++ ++ meta_entry = &meta->meta_entry[i - meta->offset]; ++ meta_entry->index_block = cur_index_block - sblk->inode_table_start; ++ meta_entry->offset = cur_offset; ++ meta_entry->data_block = cur_data_block; ++ meta->entries ++; ++ offset ++; ++ } ++ ++ TRACE("get_meta_index: meta->offset %d, meta->entries %d\n", ++ meta->offset, meta->entries); ++ ++ release_meta_index(inode, meta); ++ } ++ ++all_done: ++ *index_block = cur_index_block; ++ *index_offset = cur_offset; ++ *data_block = cur_data_block; ++ ++ return offset * SQUASHFS_META_INDEXES * skip; ++ ++failed: ++ release_meta_index(inode, meta); ++ return -1; ++} ++ ++ ++static long long read_blocklist(struct inode *inode, int index, ++ int readahead_blks, char *block_list, ++ unsigned short **block_p, unsigned int *bsize) ++{ ++ long long block_ptr; ++ int offset; ++ long long block; ++ int res = get_meta_index(inode, index, &block_ptr, &offset, &block, ++ block_list); ++ ++ TRACE("read_blocklist: res %d, index %d, block_ptr 0x%llx, offset" ++ " 0x%x, block 0x%llx\n", res, index, block_ptr, offset, ++ block); ++ ++ if(res == -1) ++ goto failure; ++ ++ index -= res; ++ ++ while ( index ) { ++ int blocks = index > (SIZE >> 2) ? (SIZE >> 2) : index; ++ int res = read_block_index(inode->i_sb, blocks, block_list, ++ &block_ptr, &offset); ++ if (res == -1) ++ goto failure; ++ block += res; ++ index -= blocks; ++ } ++ ++ if (read_block_index(inode->i_sb, 1, block_list, ++ &block_ptr, &offset) == -1) ++ goto failure; ++ *bsize = *((unsigned int *) block_list); ++ ++ return block; ++ ++failure: ++ return 0; ++} ++ ++ ++static int squashfs_readpage(struct file *file, struct page *page) ++{ ++ struct inode *inode = page->mapping->host; ++ struct squashfs_sb_info *msblk = inode->i_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ unsigned char *block_list; ++ long long block; ++ unsigned int bsize, i = 0, bytes = 0, byte_offset = 0; ++ int index = page->index >> (sblk->block_log - PAGE_CACHE_SHIFT); ++ void *pageaddr; ++ struct squashfs_fragment_cache *fragment = NULL; ++ char *data_ptr = msblk->read_page; ++ ++ int mask = (1 << (sblk->block_log - PAGE_CACHE_SHIFT)) - 1; ++ int start_index = page->index & ~mask; ++ int end_index = start_index | mask; ++ ++ TRACE("Entered squashfs_readpage, page index %lx, start block %llx\n", ++ page->index, ++ SQUASHFS_I(inode)->start_block); ++ ++ if (!(block_list = kmalloc(SIZE, GFP_KERNEL))) { ++ ERROR("Failed to allocate block_list\n"); ++ goto skip_read; ++ } ++ ++ if (page->index >= ((i_size_read(inode) + PAGE_CACHE_SIZE - 1) >> ++ PAGE_CACHE_SHIFT)) ++ goto skip_read; ++ ++ if (SQUASHFS_I(inode)->u.s1.fragment_start_block == SQUASHFS_INVALID_BLK ++ || index < (i_size_read(inode) >> ++ sblk->block_log)) { ++ if ((block = (msblk->read_blocklist)(inode, index, 1, ++ block_list, NULL, &bsize)) == 0) ++ goto skip_read; ++ ++ mutex_lock(&msblk->read_page_mutex); ++ ++ if (!(bytes = squashfs_read_data(inode->i_sb, msblk->read_page, ++ block, bsize, NULL, sblk->block_size))) { ++ ERROR("Unable to read page, block %llx, size %x\n", block, ++ bsize); ++ mutex_unlock(&msblk->read_page_mutex); ++ goto skip_read; ++ } ++ } else { ++ if ((fragment = get_cached_fragment(inode->i_sb, ++ SQUASHFS_I(inode)-> ++ u.s1.fragment_start_block, ++ SQUASHFS_I(inode)->u.s1.fragment_size)) ++ == NULL) { ++ ERROR("Unable to read page, block %llx, size %x\n", ++ SQUASHFS_I(inode)-> ++ u.s1.fragment_start_block, ++ (int) SQUASHFS_I(inode)-> ++ u.s1.fragment_size); ++ goto skip_read; ++ } ++ bytes = SQUASHFS_I(inode)->u.s1.fragment_offset + ++ (i_size_read(inode) & (sblk->block_size ++ - 1)); ++ byte_offset = SQUASHFS_I(inode)->u.s1.fragment_offset; ++ data_ptr = fragment->data; ++ } ++ ++ for (i = start_index; i <= end_index && byte_offset < bytes; ++ i++, byte_offset += PAGE_CACHE_SIZE) { ++ struct page *push_page; ++ int avail = (bytes - byte_offset) > PAGE_CACHE_SIZE ? ++ PAGE_CACHE_SIZE : bytes - byte_offset; ++ ++ TRACE("bytes %d, i %d, byte_offset %d, available_bytes %d\n", ++ bytes, i, byte_offset, avail); ++ ++ push_page = (i == page->index) ? page : ++ grab_cache_page_nowait(page->mapping, i); ++ ++ if (!push_page) ++ continue; ++ ++ if (PageUptodate(push_page)) ++ goto skip_page; ++ ++ pageaddr = kmap_atomic(push_page, KM_USER0); ++ memcpy(pageaddr, data_ptr + byte_offset, avail); ++ memset(pageaddr + avail, 0, PAGE_CACHE_SIZE - avail); ++ kunmap_atomic(pageaddr, KM_USER0); ++ flush_dcache_page(push_page); ++ SetPageUptodate(push_page); ++skip_page: ++ unlock_page(push_page); ++ if(i != page->index) ++ page_cache_release(push_page); ++ } ++ ++ if (SQUASHFS_I(inode)->u.s1.fragment_start_block == SQUASHFS_INVALID_BLK ++ || index < (i_size_read(inode) >> ++ sblk->block_log)) ++ mutex_unlock(&msblk->read_page_mutex); ++ else ++ release_cached_fragment(msblk, fragment); ++ ++ kfree(block_list); ++ return 0; ++ ++skip_read: ++ pageaddr = kmap_atomic(page, KM_USER0); ++ memset(pageaddr + bytes, 0, PAGE_CACHE_SIZE - bytes); ++ kunmap_atomic(pageaddr, KM_USER0); ++ flush_dcache_page(page); ++ SetPageUptodate(page); ++ unlock_page(page); ++ ++ kfree(block_list); ++ return 0; ++} ++ ++ ++static int squashfs_readpage4K(struct file *file, struct page *page) ++{ ++ struct inode *inode = page->mapping->host; ++ struct squashfs_sb_info *msblk = inode->i_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ unsigned char *block_list; ++ long long block; ++ unsigned int bsize, bytes = 0; ++ void *pageaddr; ++ ++ TRACE("Entered squashfs_readpage4K, page index %lx, start block %llx\n", ++ page->index, ++ SQUASHFS_I(inode)->start_block); ++ ++ if (page->index >= ((i_size_read(inode) + PAGE_CACHE_SIZE - 1) >> ++ PAGE_CACHE_SHIFT)) { ++ block_list = NULL; ++ goto skip_read; ++ } ++ ++ if (!(block_list = kmalloc(SIZE, GFP_KERNEL))) { ++ ERROR("Failed to allocate block_list\n"); ++ goto skip_read; ++ } ++ ++ if (SQUASHFS_I(inode)->u.s1.fragment_start_block == SQUASHFS_INVALID_BLK ++ || page->index < (i_size_read(inode) >> ++ sblk->block_log)) { ++ block = (msblk->read_blocklist)(inode, page->index, 1, ++ block_list, NULL, &bsize); ++ if(block == 0) ++ goto skip_read; ++ ++ mutex_lock(&msblk->read_page_mutex); ++ bytes = squashfs_read_data(inode->i_sb, msblk->read_page, block, ++ bsize, NULL, sblk->block_size); ++ if (bytes) { ++ pageaddr = kmap_atomic(page, KM_USER0); ++ memcpy(pageaddr, msblk->read_page, bytes); ++ kunmap_atomic(pageaddr, KM_USER0); ++ } else ++ ERROR("Unable to read page, block %llx, size %x\n", ++ block, bsize); ++ mutex_unlock(&msblk->read_page_mutex); ++ } else { ++ struct squashfs_fragment_cache *fragment = ++ get_cached_fragment(inode->i_sb, ++ SQUASHFS_I(inode)-> ++ u.s1.fragment_start_block, ++ SQUASHFS_I(inode)-> u.s1.fragment_size); ++ if (fragment) { ++ bytes = i_size_read(inode) & (sblk->block_size - 1); ++ pageaddr = kmap_atomic(page, KM_USER0); ++ memcpy(pageaddr, fragment->data + SQUASHFS_I(inode)-> ++ u.s1.fragment_offset, bytes); ++ kunmap_atomic(pageaddr, KM_USER0); ++ release_cached_fragment(msblk, fragment); ++ } else ++ ERROR("Unable to read page, block %llx, size %x\n", ++ SQUASHFS_I(inode)-> ++ u.s1.fragment_start_block, (int) ++ SQUASHFS_I(inode)-> u.s1.fragment_size); ++ } ++ ++skip_read: ++ pageaddr = kmap_atomic(page, KM_USER0); ++ memset(pageaddr + bytes, 0, PAGE_CACHE_SIZE - bytes); ++ kunmap_atomic(pageaddr, KM_USER0); ++ flush_dcache_page(page); ++ SetPageUptodate(page); ++ unlock_page(page); ++ ++ kfree(block_list); ++ return 0; ++} ++ ++ ++static int get_dir_index_using_offset(struct super_block *s, long long ++ *next_block, unsigned int *next_offset, ++ long long index_start, ++ unsigned int index_offset, int i_count, ++ long long f_pos) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ int i, length = 0; ++ struct squashfs_dir_index index; ++ ++ TRACE("Entered get_dir_index_using_offset, i_count %d, f_pos %d\n", ++ i_count, (unsigned int) f_pos); ++ ++ f_pos =- 3; ++ if (f_pos == 0) ++ goto finish; ++ ++ for (i = 0; i < i_count; i++) { ++ if (msblk->swap) { ++ struct squashfs_dir_index sindex; ++ squashfs_get_cached_block(s, (char *) &sindex, ++ index_start, index_offset, ++ sizeof(sindex), &index_start, ++ &index_offset); ++ SQUASHFS_SWAP_DIR_INDEX(&index, &sindex); ++ } else ++ squashfs_get_cached_block(s, (char *) &index, ++ index_start, index_offset, ++ sizeof(index), &index_start, ++ &index_offset); ++ ++ if (index.index > f_pos) ++ break; ++ ++ squashfs_get_cached_block(s, NULL, index_start, index_offset, ++ index.size + 1, &index_start, ++ &index_offset); ++ ++ length = index.index; ++ *next_block = index.start_block + sblk->directory_table_start; ++ } ++ ++ *next_offset = (length + *next_offset) % SQUASHFS_METADATA_SIZE; ++ ++finish: ++ return length + 3; ++} ++ ++ ++static int get_dir_index_using_name(struct super_block *s, long long ++ *next_block, unsigned int *next_offset, ++ long long index_start, ++ unsigned int index_offset, int i_count, ++ const char *name, int size) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ int i, length = 0; ++ struct squashfs_dir_index *index; ++ char *str; ++ ++ TRACE("Entered get_dir_index_using_name, i_count %d\n", i_count); ++ ++ if (!(str = kmalloc(sizeof(struct squashfs_dir_index) + ++ (SQUASHFS_NAME_LEN + 1) * 2, GFP_KERNEL))) { ++ ERROR("Failed to allocate squashfs_dir_index\n"); ++ goto failure; ++ } ++ ++ index = (struct squashfs_dir_index *) (str + SQUASHFS_NAME_LEN + 1); ++ strncpy(str, name, size); ++ str[size] = '\0'; ++ ++ for (i = 0; i < i_count; i++) { ++ if (msblk->swap) { ++ struct squashfs_dir_index sindex; ++ squashfs_get_cached_block(s, (char *) &sindex, ++ index_start, index_offset, ++ sizeof(sindex), &index_start, ++ &index_offset); ++ SQUASHFS_SWAP_DIR_INDEX(index, &sindex); ++ } else ++ squashfs_get_cached_block(s, (char *) index, ++ index_start, index_offset, ++ sizeof(struct squashfs_dir_index), ++ &index_start, &index_offset); ++ ++ squashfs_get_cached_block(s, index->name, index_start, ++ index_offset, index->size + 1, ++ &index_start, &index_offset); ++ ++ index->name[index->size + 1] = '\0'; ++ ++ if (strcmp(index->name, str) > 0) ++ break; ++ ++ length = index->index; ++ *next_block = index->start_block + sblk->directory_table_start; ++ } ++ ++ *next_offset = (length + *next_offset) % SQUASHFS_METADATA_SIZE; ++ kfree(str); ++failure: ++ return length + 3; ++} ++ ++ ++static int squashfs_readdir(struct file *file, void *dirent, filldir_t filldir) ++{ ++ struct inode *i = file->f_dentry->d_inode; ++ struct squashfs_sb_info *msblk = i->i_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ long long next_block = SQUASHFS_I(i)->start_block + ++ sblk->directory_table_start; ++ int next_offset = SQUASHFS_I(i)->offset, length = 0, ++ dir_count; ++ struct squashfs_dir_header dirh; ++ struct squashfs_dir_entry *dire; ++ ++ TRACE("Entered squashfs_readdir [%llx:%x]\n", next_block, next_offset); ++ ++ if (!(dire = kmalloc(sizeof(struct squashfs_dir_entry) + ++ SQUASHFS_NAME_LEN + 1, GFP_KERNEL))) { ++ ERROR("Failed to allocate squashfs_dir_entry\n"); ++ goto finish; ++ } ++ ++ while(file->f_pos < 3) { ++ char *name; ++ int size, i_ino; ++ ++ if(file->f_pos == 0) { ++ name = "."; ++ size = 1; ++ i_ino = i->i_ino; ++ } else { ++ name = ".."; ++ size = 2; ++ i_ino = SQUASHFS_I(i)->u.s2.parent_inode; ++ } ++ TRACE("Calling filldir(%x, %s, %d, %d, %d, %d)\n", ++ (unsigned int) dirent, name, size, (int) ++ file->f_pos, i_ino, ++ squashfs_filetype_table[1]); ++ ++ if (filldir(dirent, name, size, ++ file->f_pos, i_ino, ++ squashfs_filetype_table[1]) < 0) { ++ TRACE("Filldir returned less than 0\n"); ++ goto finish; ++ } ++ file->f_pos += size; ++ } ++ ++ length = get_dir_index_using_offset(i->i_sb, &next_block, &next_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_start, ++ SQUASHFS_I(i)->u.s2.directory_index_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_count, ++ file->f_pos); ++ ++ while (length < i_size_read(i)) { ++ /* read directory header */ ++ if (msblk->swap) { ++ struct squashfs_dir_header sdirh; ++ ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &sdirh, ++ next_block, next_offset, sizeof(sdirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdirh); ++ SQUASHFS_SWAP_DIR_HEADER(&dirh, &sdirh); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &dirh, ++ next_block, next_offset, sizeof(dirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(dirh); ++ } ++ ++ dir_count = dirh.count + 1; ++ while (dir_count--) { ++ if (msblk->swap) { ++ struct squashfs_dir_entry sdire; ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ &sdire, next_block, next_offset, ++ sizeof(sdire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdire); ++ SQUASHFS_SWAP_DIR_ENTRY(dire, &sdire); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ dire, next_block, next_offset, ++ sizeof(*dire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(*dire); ++ } ++ ++ if (!squashfs_get_cached_block(i->i_sb, dire->name, ++ next_block, next_offset, ++ dire->size + 1, &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += dire->size + 1; ++ ++ if (file->f_pos >= length) ++ continue; ++ ++ dire->name[dire->size + 1] = '\0'; ++ ++ TRACE("Calling filldir(%x, %s, %d, %d, %x:%x, %d, %d)\n", ++ (unsigned int) dirent, dire->name, ++ dire->size + 1, (int) file->f_pos, ++ dirh.start_block, dire->offset, ++ dirh.inode_number + dire->inode_number, ++ squashfs_filetype_table[dire->type]); ++ ++ if (filldir(dirent, dire->name, dire->size + 1, ++ file->f_pos, ++ dirh.inode_number + dire->inode_number, ++ squashfs_filetype_table[dire->type]) ++ < 0) { ++ TRACE("Filldir returned less than 0\n"); ++ goto finish; ++ } ++ file->f_pos = length; ++ } ++ } ++ ++finish: ++ kfree(dire); ++ return 0; ++ ++failed_read: ++ ERROR("Unable to read directory block [%llx:%x]\n", next_block, ++ next_offset); ++ kfree(dire); ++ return 0; ++} ++ ++ ++static struct dentry *squashfs_lookup(struct inode *i, struct dentry *dentry, ++ struct nameidata *nd) ++{ ++ const unsigned char *name = dentry->d_name.name; ++ int len = dentry->d_name.len; ++ struct inode *inode = NULL; ++ struct squashfs_sb_info *msblk = i->i_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ long long next_block = SQUASHFS_I(i)->start_block + ++ sblk->directory_table_start; ++ int next_offset = SQUASHFS_I(i)->offset, length = 0, ++ dir_count; ++ struct squashfs_dir_header dirh; ++ struct squashfs_dir_entry *dire; ++ ++ TRACE("Entered squashfs_lookup [%llx:%x]\n", next_block, next_offset); ++ ++ if (!(dire = kmalloc(sizeof(struct squashfs_dir_entry) + ++ SQUASHFS_NAME_LEN + 1, GFP_KERNEL))) { ++ ERROR("Failed to allocate squashfs_dir_entry\n"); ++ goto exit_lookup; ++ } ++ ++ if (len > SQUASHFS_NAME_LEN) ++ goto exit_lookup; ++ ++ length = get_dir_index_using_name(i->i_sb, &next_block, &next_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_start, ++ SQUASHFS_I(i)->u.s2.directory_index_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_count, name, ++ len); ++ ++ while (length < i_size_read(i)) { ++ /* read directory header */ ++ if (msblk->swap) { ++ struct squashfs_dir_header sdirh; ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &sdirh, ++ next_block, next_offset, sizeof(sdirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdirh); ++ SQUASHFS_SWAP_DIR_HEADER(&dirh, &sdirh); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &dirh, ++ next_block, next_offset, sizeof(dirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(dirh); ++ } ++ ++ dir_count = dirh.count + 1; ++ while (dir_count--) { ++ if (msblk->swap) { ++ struct squashfs_dir_entry sdire; ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ &sdire, next_block,next_offset, ++ sizeof(sdire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdire); ++ SQUASHFS_SWAP_DIR_ENTRY(dire, &sdire); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ dire, next_block,next_offset, ++ sizeof(*dire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(*dire); ++ } ++ ++ if (!squashfs_get_cached_block(i->i_sb, dire->name, ++ next_block, next_offset, dire->size + 1, ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += dire->size + 1; ++ ++ if (name[0] < dire->name[0]) ++ goto exit_lookup; ++ ++ if ((len == dire->size + 1) && !strncmp(name, dire->name, len)) { ++ squashfs_inode_t ino = SQUASHFS_MKINODE(dirh.start_block, ++ dire->offset); ++ ++ TRACE("calling squashfs_iget for directory " ++ "entry %s, inode %x:%x, %d\n", name, ++ dirh.start_block, dire->offset, ++ dirh.inode_number + dire->inode_number); ++ ++ inode = squashfs_iget(i->i_sb, ino, dirh.inode_number + dire->inode_number); ++ ++ goto exit_lookup; ++ } ++ } ++ } ++ ++exit_lookup: ++ kfree(dire); ++ if (inode) ++ return d_splice_alias(inode, dentry); ++ d_add(dentry, inode); ++ return ERR_PTR(0); ++ ++failed_read: ++ ERROR("Unable to read directory block [%llx:%x]\n", next_block, ++ next_offset); ++ goto exit_lookup; ++} ++ ++ ++static int squashfs_remount(struct super_block *s, int *flags, char *data) ++{ ++ *flags |= MS_RDONLY; ++ return 0; ++} ++ ++ ++static void squashfs_put_super(struct super_block *s) ++{ ++ int i; ++ ++ if (s->s_fs_info) { ++ struct squashfs_sb_info *sbi = s->s_fs_info; ++ if (sbi->block_cache) ++ for (i = 0; i < SQUASHFS_CACHED_BLKS; i++) ++ if (sbi->block_cache[i].block != ++ SQUASHFS_INVALID_BLK) ++ kfree(sbi->block_cache[i].data); ++ if (sbi->fragment) ++ for (i = 0; i < SQUASHFS_CACHED_FRAGMENTS; i++) ++ SQUASHFS_FREE(sbi->fragment[i].data); ++ kfree(sbi->fragment); ++ kfree(sbi->block_cache); ++ kfree(sbi->read_page); ++ kfree(sbi->uid); ++ kfree(sbi->fragment_index); ++ kfree(sbi->fragment_index_2); ++ kfree(sbi->meta_index); ++ vfree(sbi->stream.workspace); ++ kfree(s->s_fs_info); ++ s->s_fs_info = NULL; ++ } ++} ++ ++ ++static int squashfs_get_sb(struct file_system_type *fs_type, int flags, ++ const char *dev_name, void *data, ++ struct vfsmount *mnt) ++{ ++ return get_sb_bdev(fs_type, flags, dev_name, data, squashfs_fill_super, ++ mnt); ++} ++ ++ ++static int __init init_squashfs_fs(void) ++{ ++ int err = init_inodecache(); ++ if (err) ++ goto out; ++ ++ printk(KERN_INFO "squashfs: version 3.2-r2 (2007/01/15) " ++ "Phillip Lougher\n"); ++ ++ if ((err = register_filesystem(&squashfs_fs_type))) ++ destroy_inodecache(); ++ ++out: ++ return err; ++} ++ ++ ++static void __exit exit_squashfs_fs(void) ++{ ++ unregister_filesystem(&squashfs_fs_type); ++ destroy_inodecache(); ++} ++ ++ ++static struct kmem_cache * squashfs_inode_cachep; ++ ++ ++static struct inode *squashfs_alloc_inode(struct super_block *sb) ++{ ++ struct squashfs_inode_info *ei; ++ ei = kmem_cache_alloc(squashfs_inode_cachep, GFP_KERNEL); ++ if (!ei) ++ return NULL; ++ return &ei->vfs_inode; ++} ++ ++ ++static void squashfs_destroy_inode(struct inode *inode) ++{ ++ kmem_cache_free(squashfs_inode_cachep, SQUASHFS_I(inode)); ++} ++ ++ ++static void init_once(void * foo, struct kmem_cache * cachep, unsigned long flags) ++{ ++ struct squashfs_inode_info *ei = foo; ++ ++ if ((flags & (SLAB_CTOR_VERIFY|SLAB_CTOR_CONSTRUCTOR)) == ++ SLAB_CTOR_CONSTRUCTOR) ++ inode_init_once(&ei->vfs_inode); ++} ++ ++ ++static int __init init_inodecache(void) ++{ ++ squashfs_inode_cachep = kmem_cache_create("squashfs_inode_cache", ++ sizeof(struct squashfs_inode_info), ++ 0, SLAB_HWCACHE_ALIGN|SLAB_RECLAIM_ACCOUNT, ++ init_once, NULL); ++ if (squashfs_inode_cachep == NULL) ++ return -ENOMEM; ++ return 0; ++} ++ ++ ++static void destroy_inodecache(void) ++{ ++ kmem_cache_destroy(squashfs_inode_cachep); ++} ++ ++ ++module_init(init_squashfs_fs); ++module_exit(exit_squashfs_fs); ++MODULE_DESCRIPTION("squashfs 3.2-r2, a compressed read-only filesystem"); ++MODULE_AUTHOR("Phillip Lougher <phillip@lougher.org.uk>"); ++MODULE_LICENSE("GPL"); +diff --git a/fs/squashfs/squashfs.h b/fs/squashfs/squashfs.h +new file mode 100644 +index 0000000..6f863f0 +--- /dev/null ++++ b/fs/squashfs/squashfs.h +@@ -0,0 +1,87 @@ ++/* ++ * Squashfs - a compressed read only filesystem for Linux ++ * ++ * Copyright (c) 2002, 2003, 2004, 2005, 2006, 2007 ++ * Phillip Lougher <phillip@lougher.org.uk> ++ * ++ * This program is free software; you can redistribute it and/or ++ * modify it under the terms of the GNU General Public License ++ * as published by the Free Software Foundation; either version 2, ++ * or (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ++ * ++ * squashfs.h ++ */ ++ ++#ifdef CONFIG_SQUASHFS_1_0_COMPATIBILITY ++#undef CONFIG_SQUASHFS_1_0_COMPATIBILITY ++#endif ++ ++#ifdef SQUASHFS_TRACE ++#define TRACE(s, args...) printk(KERN_NOTICE "SQUASHFS: "s, ## args) ++#else ++#define TRACE(s, args...) {} ++#endif ++ ++#define ERROR(s, args...) printk(KERN_ERR "SQUASHFS error: "s, ## args) ++ ++#define SERROR(s, args...) do { \ ++ if (!silent) \ ++ printk(KERN_ERR "SQUASHFS error: "s, ## args);\ ++ } while(0) ++ ++#define WARNING(s, args...) printk(KERN_WARNING "SQUASHFS: "s, ## args) ++ ++static inline struct squashfs_inode_info *SQUASHFS_I(struct inode *inode) ++{ ++ return list_entry(inode, struct squashfs_inode_info, vfs_inode); ++} ++ ++#if defined(CONFIG_SQUASHFS_1_0_COMPATIBILITY ) || defined(CONFIG_SQUASHFS_2_0_COMPATIBILITY) ++#define SQSH_EXTERN ++extern unsigned int squashfs_read_data(struct super_block *s, char *buffer, ++ long long index, unsigned int length, ++ long long *next_index, int srclength); ++extern int squashfs_get_cached_block(struct super_block *s, char *buffer, ++ long long block, unsigned int offset, ++ int length, long long *next_block, ++ unsigned int *next_offset); ++extern void release_cached_fragment(struct squashfs_sb_info *msblk, struct ++ squashfs_fragment_cache *fragment); ++extern struct squashfs_fragment_cache *get_cached_fragment(struct super_block ++ *s, long long start_block, ++ int length); ++extern struct inode *squashfs_iget(struct super_block *s, squashfs_inode_t inode, unsigned int inode_number); ++extern const struct address_space_operations squashfs_symlink_aops; ++extern const struct address_space_operations squashfs_aops; ++extern const struct address_space_operations squashfs_aops_4K; ++extern struct inode_operations squashfs_dir_inode_ops; ++#else ++#define SQSH_EXTERN static ++#endif ++ ++#ifdef CONFIG_SQUASHFS_1_0_COMPATIBILITY ++extern int squashfs_1_0_supported(struct squashfs_sb_info *msblk); ++#else ++static inline int squashfs_1_0_supported(struct squashfs_sb_info *msblk) ++{ ++ return 0; ++} ++#endif ++ ++#ifdef CONFIG_SQUASHFS_2_0_COMPATIBILITY ++extern int squashfs_2_0_supported(struct squashfs_sb_info *msblk); ++#else ++static inline int squashfs_2_0_supported(struct squashfs_sb_info *msblk) ++{ ++ return 0; ++} ++#endif +diff --git a/fs/squashfs/squashfs2_0.c b/fs/squashfs/squashfs2_0.c +new file mode 100644 +index 0000000..d8d9d55 +--- /dev/null ++++ b/fs/squashfs/squashfs2_0.c +@@ -0,0 +1,742 @@ ++/* ++ * Squashfs - a compressed read only filesystem for Linux ++ * ++ * Copyright (c) 2002, 2003, 2004, 2005, 2006, 2007 ++ * Phillip Lougher <phillip@lougher.org.uk> ++ * ++ * This program is free software; you can redistribute it and/or ++ * modify it under the terms of the GNU General Public License ++ * as published by the Free Software Foundation; either version 2, ++ * or (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ++ * ++ * squashfs2_0.c ++ */ ++ ++#include <linux/squashfs_fs.h> ++#include <linux/module.h> ++#include <linux/zlib.h> ++#include <linux/fs.h> ++#include <linux/squashfs_fs_sb.h> ++#include <linux/squashfs_fs_i.h> ++ ++#include "squashfs.h" ++static int squashfs_readdir_2(struct file *file, void *dirent, filldir_t filldir); ++static struct dentry *squashfs_lookup_2(struct inode *, struct dentry *, ++ struct nameidata *); ++ ++static struct file_operations squashfs_dir_ops_2 = { ++ .read = generic_read_dir, ++ .readdir = squashfs_readdir_2 ++}; ++ ++static struct inode_operations squashfs_dir_inode_ops_2 = { ++ .lookup = squashfs_lookup_2 ++}; ++ ++static unsigned char squashfs_filetype_table[] = { ++ DT_UNKNOWN, DT_DIR, DT_REG, DT_LNK, DT_BLK, DT_CHR, DT_FIFO, DT_SOCK ++}; ++ ++static int read_fragment_index_table_2(struct super_block *s) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ ++ if (!(msblk->fragment_index_2 = kmalloc(SQUASHFS_FRAGMENT_INDEX_BYTES_2 ++ (sblk->fragments), GFP_KERNEL))) { ++ ERROR("Failed to allocate uid/gid table\n"); ++ return 0; ++ } ++ ++ if (SQUASHFS_FRAGMENT_INDEX_BYTES_2(sblk->fragments) && ++ !squashfs_read_data(s, (char *) ++ msblk->fragment_index_2, ++ sblk->fragment_table_start, ++ SQUASHFS_FRAGMENT_INDEX_BYTES_2 ++ (sblk->fragments) | ++ SQUASHFS_COMPRESSED_BIT_BLOCK, NULL, SQUASHFS_FRAGMENT_INDEX_BYTES_2(sblk->fragments))) { ++ ERROR("unable to read fragment index table\n"); ++ return 0; ++ } ++ ++ if (msblk->swap) { ++ int i; ++ unsigned int fragment; ++ ++ for (i = 0; i < SQUASHFS_FRAGMENT_INDEXES_2(sblk->fragments); ++ i++) { ++ SQUASHFS_SWAP_FRAGMENT_INDEXES_2((&fragment), ++ &msblk->fragment_index_2[i], 1); ++ msblk->fragment_index_2[i] = fragment; ++ } ++ } ++ ++ return 1; ++} ++ ++ ++static int get_fragment_location_2(struct super_block *s, unsigned int fragment, ++ long long *fragment_start_block, ++ unsigned int *fragment_size) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ long long start_block = ++ msblk->fragment_index_2[SQUASHFS_FRAGMENT_INDEX_2(fragment)]; ++ int offset = SQUASHFS_FRAGMENT_INDEX_OFFSET_2(fragment); ++ struct squashfs_fragment_entry_2 fragment_entry; ++ ++ if (msblk->swap) { ++ struct squashfs_fragment_entry_2 sfragment_entry; ++ ++ if (!squashfs_get_cached_block(s, (char *) &sfragment_entry, ++ start_block, offset, ++ sizeof(sfragment_entry), &start_block, ++ &offset)) ++ goto out; ++ SQUASHFS_SWAP_FRAGMENT_ENTRY_2(&fragment_entry, &sfragment_entry); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) &fragment_entry, ++ start_block, offset, ++ sizeof(fragment_entry), &start_block, ++ &offset)) ++ goto out; ++ ++ *fragment_start_block = fragment_entry.start_block; ++ *fragment_size = fragment_entry.size; ++ ++ return 1; ++ ++out: ++ return 0; ++} ++ ++ ++static void squashfs_new_inode(struct squashfs_sb_info *msblk, struct inode *i, ++ struct squashfs_base_inode_header_2 *inodeb, unsigned int ino) ++{ ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ ++ i->i_ino = ino; ++ i->i_mtime.tv_sec = sblk->mkfs_time; ++ i->i_atime.tv_sec = sblk->mkfs_time; ++ i->i_ctime.tv_sec = sblk->mkfs_time; ++ i->i_uid = msblk->uid[inodeb->uid]; ++ i->i_mode = inodeb->mode; ++ i->i_nlink = 1; ++ i->i_size = 0; ++ if (inodeb->guid == SQUASHFS_GUIDS) ++ i->i_gid = i->i_uid; ++ else ++ i->i_gid = msblk->guid[inodeb->guid]; ++} ++ ++ ++static int squashfs_read_inode_2(struct inode *i, squashfs_inode_t inode) ++{ ++ struct super_block *s = i->i_sb; ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ unsigned int block = SQUASHFS_INODE_BLK(inode) + ++ sblk->inode_table_start; ++ unsigned int offset = SQUASHFS_INODE_OFFSET(inode); ++ unsigned int ino = i->i_ino; ++ long long next_block; ++ unsigned int next_offset; ++ union squashfs_inode_header_2 id, sid; ++ struct squashfs_base_inode_header_2 *inodeb = &id.base, ++ *sinodeb = &sid.base; ++ ++ TRACE("Entered squashfs_iget\n"); ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) sinodeb, block, ++ offset, sizeof(*sinodeb), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_BASE_INODE_HEADER_2(inodeb, sinodeb, ++ sizeof(*sinodeb)); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) inodeb, block, ++ offset, sizeof(*inodeb), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ squashfs_new_inode(msblk, i, inodeb, ino); ++ ++ switch(inodeb->inode_type) { ++ case SQUASHFS_FILE_TYPE: { ++ struct squashfs_reg_inode_header_2 *inodep = &id.reg; ++ struct squashfs_reg_inode_header_2 *sinodep = &sid.reg; ++ long long frag_blk; ++ unsigned int frag_size = 0; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_REG_INODE_HEADER_2(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ frag_blk = SQUASHFS_INVALID_BLK; ++ if (inodep->fragment != SQUASHFS_INVALID_FRAG && ++ !get_fragment_location_2(s, ++ inodep->fragment, &frag_blk, &frag_size)) ++ goto failed_read; ++ ++ i->i_size = inodep->file_size; ++ i->i_fop = &generic_ro_fops; ++ i->i_mode |= S_IFREG; ++ i->i_mtime.tv_sec = inodep->mtime; ++ i->i_atime.tv_sec = inodep->mtime; ++ i->i_ctime.tv_sec = inodep->mtime; ++ i->i_blocks = ((i->i_size - 1) >> 9) + 1; ++ SQUASHFS_I(i)->u.s1.fragment_start_block = frag_blk; ++ SQUASHFS_I(i)->u.s1.fragment_size = frag_size; ++ SQUASHFS_I(i)->u.s1.fragment_offset = inodep->offset; ++ SQUASHFS_I(i)->start_block = inodep->start_block; ++ SQUASHFS_I(i)->u.s1.block_list_start = next_block; ++ SQUASHFS_I(i)->offset = next_offset; ++ if (sblk->block_size > 4096) ++ i->i_data.a_ops = &squashfs_aops; ++ else ++ i->i_data.a_ops = &squashfs_aops_4K; ++ ++ TRACE("File inode %x:%x, start_block %x, " ++ "block_list_start %llx, offset %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ inodep->start_block, next_block, ++ next_offset); ++ break; ++ } ++ case SQUASHFS_DIR_TYPE: { ++ struct squashfs_dir_inode_header_2 *inodep = &id.dir; ++ struct squashfs_dir_inode_header_2 *sinodep = &sid.dir; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_DIR_INODE_HEADER_2(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_size = inodep->file_size; ++ i->i_op = &squashfs_dir_inode_ops_2; ++ i->i_fop = &squashfs_dir_ops_2; ++ i->i_mode |= S_IFDIR; ++ i->i_mtime.tv_sec = inodep->mtime; ++ i->i_atime.tv_sec = inodep->mtime; ++ i->i_ctime.tv_sec = inodep->mtime; ++ SQUASHFS_I(i)->start_block = inodep->start_block; ++ SQUASHFS_I(i)->offset = inodep->offset; ++ SQUASHFS_I(i)->u.s2.directory_index_count = 0; ++ SQUASHFS_I(i)->u.s2.parent_inode = 0; ++ ++ TRACE("Directory inode %x:%x, start_block %x, offset " ++ "%x\n", SQUASHFS_INODE_BLK(inode), ++ offset, inodep->start_block, ++ inodep->offset); ++ break; ++ } ++ case SQUASHFS_LDIR_TYPE: { ++ struct squashfs_ldir_inode_header_2 *inodep = &id.ldir; ++ struct squashfs_ldir_inode_header_2 *sinodep = &sid.ldir; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_LDIR_INODE_HEADER_2(inodep, ++ sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_size = inodep->file_size; ++ i->i_op = &squashfs_dir_inode_ops_2; ++ i->i_fop = &squashfs_dir_ops_2; ++ i->i_mode |= S_IFDIR; ++ i->i_mtime.tv_sec = inodep->mtime; ++ i->i_atime.tv_sec = inodep->mtime; ++ i->i_ctime.tv_sec = inodep->mtime; ++ SQUASHFS_I(i)->start_block = inodep->start_block; ++ SQUASHFS_I(i)->offset = inodep->offset; ++ SQUASHFS_I(i)->u.s2.directory_index_start = next_block; ++ SQUASHFS_I(i)->u.s2.directory_index_offset = ++ next_offset; ++ SQUASHFS_I(i)->u.s2.directory_index_count = ++ inodep->i_count; ++ SQUASHFS_I(i)->u.s2.parent_inode = 0; ++ ++ TRACE("Long directory inode %x:%x, start_block %x, " ++ "offset %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ inodep->start_block, inodep->offset); ++ break; ++ } ++ case SQUASHFS_SYMLINK_TYPE: { ++ struct squashfs_symlink_inode_header_2 *inodep = ++ &id.symlink; ++ struct squashfs_symlink_inode_header_2 *sinodep = ++ &sid.symlink; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_SYMLINK_INODE_HEADER_2(inodep, ++ sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_size = inodep->symlink_size; ++ i->i_op = &page_symlink_inode_operations; ++ i->i_data.a_ops = &squashfs_symlink_aops; ++ i->i_mode |= S_IFLNK; ++ SQUASHFS_I(i)->start_block = next_block; ++ SQUASHFS_I(i)->offset = next_offset; ++ ++ TRACE("Symbolic link inode %x:%x, start_block %llx, " ++ "offset %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ next_block, next_offset); ++ break; ++ } ++ case SQUASHFS_BLKDEV_TYPE: ++ case SQUASHFS_CHRDEV_TYPE: { ++ struct squashfs_dev_inode_header_2 *inodep = &id.dev; ++ struct squashfs_dev_inode_header_2 *sinodep = &sid.dev; ++ ++ if (msblk->swap) { ++ if (!squashfs_get_cached_block(s, (char *) ++ sinodep, block, offset, ++ sizeof(*sinodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ SQUASHFS_SWAP_DEV_INODE_HEADER_2(inodep, sinodep); ++ } else ++ if (!squashfs_get_cached_block(s, (char *) ++ inodep, block, offset, ++ sizeof(*inodep), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ i->i_mode |= (inodeb->inode_type == ++ SQUASHFS_CHRDEV_TYPE) ? S_IFCHR : ++ S_IFBLK; ++ init_special_inode(i, i->i_mode, ++ old_decode_dev(inodep->rdev)); ++ ++ TRACE("Device inode %x:%x, rdev %x\n", ++ SQUASHFS_INODE_BLK(inode), offset, ++ inodep->rdev); ++ break; ++ } ++ case SQUASHFS_FIFO_TYPE: ++ case SQUASHFS_SOCKET_TYPE: { ++ ++ i->i_mode |= (inodeb->inode_type == SQUASHFS_FIFO_TYPE) ++ ? S_IFIFO : S_IFSOCK; ++ init_special_inode(i, i->i_mode, 0); ++ break; ++ } ++ default: ++ ERROR("Unknown inode type %d in squashfs_iget!\n", ++ inodeb->inode_type); ++ goto failed_read1; ++ } ++ ++ return 1; ++ ++failed_read: ++ ERROR("Unable to read inode [%x:%x]\n", block, offset); ++ ++failed_read1: ++ return 0; ++} ++ ++ ++static int get_dir_index_using_offset(struct super_block *s, long long ++ *next_block, unsigned int *next_offset, ++ long long index_start, ++ unsigned int index_offset, int i_count, ++ long long f_pos) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ int i, length = 0; ++ struct squashfs_dir_index_2 index; ++ ++ TRACE("Entered get_dir_index_using_offset, i_count %d, f_pos %d\n", ++ i_count, (unsigned int) f_pos); ++ ++ if (f_pos == 0) ++ goto finish; ++ ++ for (i = 0; i < i_count; i++) { ++ if (msblk->swap) { ++ struct squashfs_dir_index_2 sindex; ++ squashfs_get_cached_block(s, (char *) &sindex, ++ index_start, index_offset, ++ sizeof(sindex), &index_start, ++ &index_offset); ++ SQUASHFS_SWAP_DIR_INDEX_2(&index, &sindex); ++ } else ++ squashfs_get_cached_block(s, (char *) &index, ++ index_start, index_offset, ++ sizeof(index), &index_start, ++ &index_offset); ++ ++ if (index.index > f_pos) ++ break; ++ ++ squashfs_get_cached_block(s, NULL, index_start, index_offset, ++ index.size + 1, &index_start, ++ &index_offset); ++ ++ length = index.index; ++ *next_block = index.start_block + sblk->directory_table_start; ++ } ++ ++ *next_offset = (length + *next_offset) % SQUASHFS_METADATA_SIZE; ++ ++finish: ++ return length; ++} ++ ++ ++static int get_dir_index_using_name(struct super_block *s, long long ++ *next_block, unsigned int *next_offset, ++ long long index_start, ++ unsigned int index_offset, int i_count, ++ const char *name, int size) ++{ ++ struct squashfs_sb_info *msblk = s->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ int i, length = 0; ++ struct squashfs_dir_index_2 *index; ++ char *str; ++ ++ TRACE("Entered get_dir_index_using_name, i_count %d\n", i_count); ++ ++ if (!(str = kmalloc(sizeof(struct squashfs_dir_index) + ++ (SQUASHFS_NAME_LEN + 1) * 2, GFP_KERNEL))) { ++ ERROR("Failed to allocate squashfs_dir_index\n"); ++ goto failure; ++ } ++ ++ index = (struct squashfs_dir_index_2 *) (str + SQUASHFS_NAME_LEN + 1); ++ strncpy(str, name, size); ++ str[size] = '\0'; ++ ++ for (i = 0; i < i_count; i++) { ++ if (msblk->swap) { ++ struct squashfs_dir_index_2 sindex; ++ squashfs_get_cached_block(s, (char *) &sindex, ++ index_start, index_offset, ++ sizeof(sindex), &index_start, ++ &index_offset); ++ SQUASHFS_SWAP_DIR_INDEX_2(index, &sindex); ++ } else ++ squashfs_get_cached_block(s, (char *) index, ++ index_start, index_offset, ++ sizeof(struct squashfs_dir_index_2), ++ &index_start, &index_offset); ++ ++ squashfs_get_cached_block(s, index->name, index_start, ++ index_offset, index->size + 1, ++ &index_start, &index_offset); ++ ++ index->name[index->size + 1] = '\0'; ++ ++ if (strcmp(index->name, str) > 0) ++ break; ++ ++ length = index->index; ++ *next_block = index->start_block + sblk->directory_table_start; ++ } ++ ++ *next_offset = (length + *next_offset) % SQUASHFS_METADATA_SIZE; ++ kfree(str); ++failure: ++ return length; ++} ++ ++ ++static int squashfs_readdir_2(struct file *file, void *dirent, filldir_t filldir) ++{ ++ struct inode *i = file->f_dentry->d_inode; ++ struct squashfs_sb_info *msblk = i->i_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ long long next_block = SQUASHFS_I(i)->start_block + ++ sblk->directory_table_start; ++ int next_offset = SQUASHFS_I(i)->offset, length = 0, ++ dir_count; ++ struct squashfs_dir_header_2 dirh; ++ struct squashfs_dir_entry_2 *dire; ++ ++ TRACE("Entered squashfs_readdir_2 [%llx:%x]\n", next_block, next_offset); ++ ++ if (!(dire = kmalloc(sizeof(struct squashfs_dir_entry) + ++ SQUASHFS_NAME_LEN + 1, GFP_KERNEL))) { ++ ERROR("Failed to allocate squashfs_dir_entry\n"); ++ goto finish; ++ } ++ ++ length = get_dir_index_using_offset(i->i_sb, &next_block, &next_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_start, ++ SQUASHFS_I(i)->u.s2.directory_index_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_count, ++ file->f_pos); ++ ++ while (length < i_size_read(i)) { ++ /* read directory header */ ++ if (msblk->swap) { ++ struct squashfs_dir_header_2 sdirh; ++ ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &sdirh, ++ next_block, next_offset, sizeof(sdirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdirh); ++ SQUASHFS_SWAP_DIR_HEADER_2(&dirh, &sdirh); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &dirh, ++ next_block, next_offset, sizeof(dirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(dirh); ++ } ++ ++ dir_count = dirh.count + 1; ++ while (dir_count--) { ++ if (msblk->swap) { ++ struct squashfs_dir_entry_2 sdire; ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ &sdire, next_block, next_offset, ++ sizeof(sdire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdire); ++ SQUASHFS_SWAP_DIR_ENTRY_2(dire, &sdire); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ dire, next_block, next_offset, ++ sizeof(*dire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(*dire); ++ } ++ ++ if (!squashfs_get_cached_block(i->i_sb, dire->name, ++ next_block, next_offset, ++ dire->size + 1, &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += dire->size + 1; ++ ++ if (file->f_pos >= length) ++ continue; ++ ++ dire->name[dire->size + 1] = '\0'; ++ ++ TRACE("Calling filldir(%x, %s, %d, %d, %x:%x, %d)\n", ++ (unsigned int) dirent, dire->name, ++ dire->size + 1, (int) file->f_pos, ++ dirh.start_block, dire->offset, ++ squashfs_filetype_table[dire->type]); ++ ++ if (filldir(dirent, dire->name, dire->size + 1, ++ file->f_pos, SQUASHFS_MK_VFS_INODE( ++ dirh.start_block, dire->offset), ++ squashfs_filetype_table[dire->type]) ++ < 0) { ++ TRACE("Filldir returned less than 0\n"); ++ goto finish; ++ } ++ file->f_pos = length; ++ } ++ } ++ ++finish: ++ kfree(dire); ++ return 0; ++ ++failed_read: ++ ERROR("Unable to read directory block [%llx:%x]\n", next_block, ++ next_offset); ++ kfree(dire); ++ return 0; ++} ++ ++ ++static struct dentry *squashfs_lookup_2(struct inode *i, struct dentry *dentry, ++ struct nameidata *nd) ++{ ++ const unsigned char *name = dentry->d_name.name; ++ int len = dentry->d_name.len; ++ struct inode *inode = NULL; ++ struct squashfs_sb_info *msblk = i->i_sb->s_fs_info; ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ long long next_block = SQUASHFS_I(i)->start_block + ++ sblk->directory_table_start; ++ int next_offset = SQUASHFS_I(i)->offset, length = 0, ++ dir_count; ++ struct squashfs_dir_header_2 dirh; ++ struct squashfs_dir_entry_2 *dire; ++ int sorted = sblk->s_major == 2 && sblk->s_minor >= 1; ++ ++ TRACE("Entered squashfs_lookup_2 [%llx:%x]\n", next_block, next_offset); ++ ++ if (!(dire = kmalloc(sizeof(struct squashfs_dir_entry) + ++ SQUASHFS_NAME_LEN + 1, GFP_KERNEL))) { ++ ERROR("Failed to allocate squashfs_dir_entry\n"); ++ goto exit_loop; ++ } ++ ++ if (len > SQUASHFS_NAME_LEN) ++ goto exit_loop; ++ ++ length = get_dir_index_using_name(i->i_sb, &next_block, &next_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_start, ++ SQUASHFS_I(i)->u.s2.directory_index_offset, ++ SQUASHFS_I(i)->u.s2.directory_index_count, name, ++ len); ++ ++ while (length < i_size_read(i)) { ++ /* read directory header */ ++ if (msblk->swap) { ++ struct squashfs_dir_header_2 sdirh; ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &sdirh, ++ next_block, next_offset, sizeof(sdirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdirh); ++ SQUASHFS_SWAP_DIR_HEADER_2(&dirh, &sdirh); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) &dirh, ++ next_block, next_offset, sizeof(dirh), ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(dirh); ++ } ++ ++ dir_count = dirh.count + 1; ++ while (dir_count--) { ++ if (msblk->swap) { ++ struct squashfs_dir_entry_2 sdire; ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ &sdire, next_block,next_offset, ++ sizeof(sdire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(sdire); ++ SQUASHFS_SWAP_DIR_ENTRY_2(dire, &sdire); ++ } else { ++ if (!squashfs_get_cached_block(i->i_sb, (char *) ++ dire, next_block,next_offset, ++ sizeof(*dire), &next_block, ++ &next_offset)) ++ goto failed_read; ++ ++ length += sizeof(*dire); ++ } ++ ++ if (!squashfs_get_cached_block(i->i_sb, dire->name, ++ next_block, next_offset, dire->size + 1, ++ &next_block, &next_offset)) ++ goto failed_read; ++ ++ length += dire->size + 1; ++ ++ if (sorted && name[0] < dire->name[0]) ++ goto exit_loop; ++ ++ if ((len == dire->size + 1) && !strncmp(name, ++ dire->name, len)) { ++ squashfs_inode_t ino = ++ SQUASHFS_MKINODE(dirh.start_block, ++ dire->offset); ++ unsigned int inode_number = SQUASHFS_MK_VFS_INODE(dirh.start_block, ++ dire->offset); ++ ++ TRACE("calling squashfs_iget for directory " ++ "entry %s, inode %x:%x, %lld\n", name, ++ dirh.start_block, dire->offset, ino); ++ ++ inode = squashfs_iget(i->i_sb, ino, inode_number); ++ ++ goto exit_loop; ++ } ++ } ++ } ++ ++exit_loop: ++ kfree(dire); ++ d_add(dentry, inode); ++ return ERR_PTR(0); ++ ++failed_read: ++ ERROR("Unable to read directory block [%llx:%x]\n", next_block, ++ next_offset); ++ goto exit_loop; ++} ++ ++ ++int squashfs_2_0_supported(struct squashfs_sb_info *msblk) ++{ ++ struct squashfs_super_block *sblk = &msblk->sblk; ++ ++ msblk->read_inode = squashfs_read_inode_2; ++ msblk->read_fragment_index_table = read_fragment_index_table_2; ++ ++ sblk->bytes_used = sblk->bytes_used_2; ++ sblk->uid_start = sblk->uid_start_2; ++ sblk->guid_start = sblk->guid_start_2; ++ sblk->inode_table_start = sblk->inode_table_start_2; ++ sblk->directory_table_start = sblk->directory_table_start_2; ++ sblk->fragment_table_start = sblk->fragment_table_start_2; ++ ++ return 1; ++} +diff --git a/include/linux/aufs_type.h b/include/linux/aufs_type.h +new file mode 100755 +index 0000000..8b4629e +--- /dev/null ++++ b/include/linux/aufs_type.h +@@ -0,0 +1,97 @@ ++/* ++ * Copyright (C) 2005, 2006, 2007 Junjiro Okajima ++ * ++ * This program, aufs is free software; you can redistribute it and/or modify ++ * it under the terms of the GNU General Public License as published by ++ * the Free Software Foundation; either version 2 of the License, or ++ * (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA ++ */ ++ ++/* $Id: aufs_type.h,v 1.55 2007/05/14 03:40:57 sfjro Exp $ */ ++ ++#include <linux/ioctl.h> ++ ++#ifndef __AUFS_TYPE_H__ ++#define __AUFS_TYPE_H__ ++ ++#define AUFS_VERSION "20070514" ++ ++/* ---------------------------------------------------------------------- */ ++ ++#ifdef CONFIG_AUFS_BRANCH_MAX_127 ++typedef char aufs_bindex_t; ++#define AUFS_BRANCH_MAX 127 ++#else ++typedef short aufs_bindex_t; ++#ifdef CONFIG_AUFS_BRANCH_MAX_511 ++#define AUFS_BRANCH_MAX 511 ++#elif defined(CONFIG_AUFS_BRANCH_MAX_1023) ++#define AUFS_BRANCH_MAX 1023 ++#elif defined(CONFIG_AUFS_BRANCH_MAX_32767) ++#define AUFS_BRANCH_MAX 32767 ++#else ++#error unknown CONFIG_AUFS_BRANCH_MAX value ++#endif ++#endif ++ ++#define AUFS_NAME "aufs" ++#define AUFS_FSTYPE AUFS_NAME ++ ++#define AUFS_ROOT_INO 2 ++#define AUFS_FIRST_INO 11 ++ ++#define AUFS_WH_PFX ".wh." ++#define AUFS_WH_PFX_LEN ((int)sizeof(AUFS_WH_PFX) - 1) ++#define AUFS_XINO_FNAME "." AUFS_NAME ".xino" ++#define AUFS_XINO_DEFPATH "/tmp/" AUFS_XINO_FNAME ++#define AUFS_DIRWH_DEF 3 ++#define AUFS_RDCACHE_DEF 10 /* seconds */ ++#define AUFS_WKQ_NAME AUFS_NAME "d" ++#define AUFS_NWKQ_DEF 4 ++ ++#ifdef CONFIG_AUFS_COMPAT ++#define AUFS_DIROPQ_NAME "__dir_opaque" ++#else ++#define AUFS_DIROPQ_NAME AUFS_WH_PFX ".opq" /* whiteouted doubly */ ++#endif ++#define AUFS_WH_DIROPQ AUFS_WH_PFX AUFS_DIROPQ_NAME ++ ++/* will be whiteouted doubly */ ++#define AUFS_WH_BASENAME AUFS_WH_PFX AUFS_NAME ++#define AUFS_WH_PLINKDIR AUFS_WH_PFX "plink" ++ ++/* ---------------------------------------------------------------------- */ ++ ++/* ioctl */ ++enum {AuCtlErr, AuCtlErr_Last}; ++enum { ++ AuCtl_REFRESH, //AuCtl_REFRESHV, ++ //AuCtl_FLUSH_PLINK, ++ //AuCtl_CPUP, ++ AuCtl_CPDOWN, AuCtl_MVDOWN ++}; ++ ++struct aufs_ctl_cp { ++ int bsrc, bdst; ++ int err; ++}; ++ ++#define Type 'A' ++#define AUFS_CTL_REFRESH _IO(Type, AuCtl_REFRESH) ++//#define AUFS_CTL_REFRESHV _IO(Type, AuCtl_REFRESHV) ++//#define AUFS_CTL_FLUSH_PLINK _IOR(Type, AuCtl_FLUSH_PLINK) ++//#define AUFS_CTL_CPUP _IOWR(Type, AuCtl_CPUP, struct aufs_ctl_cp) ++#define AUFS_CTL_CPDOWN _IOWR(Type, AuCtl_CPDOWN, struct aufs_ctl_cp) ++#define AUFS_CTL_MVDOWN _IOWR(Type, AuCtl_MVDOWN, struct aufs_ctl_cp) ++#undef Type ++ ++#endif /* __AUFS_TYPE_H__ */ +diff --git a/include/linux/squashfs_fs.h b/include/linux/squashfs_fs.h +new file mode 100644 +index 0000000..a9380ad +--- /dev/null ++++ b/include/linux/squashfs_fs.h +@@ -0,0 +1,934 @@ ++#ifndef SQUASHFS_FS ++#define SQUASHFS_FS ++ ++/* ++ * Squashfs ++ * ++ * Copyright (c) 2002, 2003, 2004, 2005, 2006, 2007 ++ * Phillip Lougher <phillip@lougher.org.uk> ++ * ++ * This program is free software; you can redistribute it and/or ++ * modify it under the terms of the GNU General Public License ++ * as published by the Free Software Foundation; either version 2, ++ * or (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ++ * ++ * squashfs_fs.h ++ */ ++ ++#ifndef CONFIG_SQUASHFS_2_0_COMPATIBILITY ++#define CONFIG_SQUASHFS_2_0_COMPATIBILITY ++#endif ++ ++#ifdef CONFIG_SQUASHFS_VMALLOC ++#define SQUASHFS_ALLOC(a) vmalloc(a) ++#define SQUASHFS_FREE(a) vfree(a) ++#else ++#define SQUASHFS_ALLOC(a) kmalloc(a, GFP_KERNEL) ++#define SQUASHFS_FREE(a) kfree(a) ++#endif ++#define SQUASHFS_CACHED_FRAGMENTS CONFIG_SQUASHFS_FRAGMENT_CACHE_SIZE ++#define SQUASHFS_MAJOR 3 ++#define SQUASHFS_MINOR 0 ++#define SQUASHFS_MAGIC 0x73717368 ++#define SQUASHFS_MAGIC_SWAP 0x68737173 ++#define SQUASHFS_START 0 ++ ++/* size of metadata (inode and directory) blocks */ ++#define SQUASHFS_METADATA_SIZE 8192 ++#define SQUASHFS_METADATA_LOG 13 ++ ++/* default size of data blocks */ ++#define SQUASHFS_FILE_SIZE 65536 ++#define SQUASHFS_FILE_LOG 16 ++ ++#define SQUASHFS_FILE_MAX_SIZE 65536 ++ ++/* Max number of uids and gids */ ++#define SQUASHFS_UIDS 256 ++#define SQUASHFS_GUIDS 255 ++ ++/* Max length of filename (not 255) */ ++#define SQUASHFS_NAME_LEN 256 ++ ++#define SQUASHFS_INVALID ((long long) 0xffffffffffff) ++#define SQUASHFS_INVALID_FRAG ((unsigned int) 0xffffffff) ++#define SQUASHFS_INVALID_BLK ((long long) -1) ++#define SQUASHFS_USED_BLK ((long long) -2) ++ ++/* Filesystem flags */ ++#define SQUASHFS_NOI 0 ++#define SQUASHFS_NOD 1 ++#define SQUASHFS_CHECK 2 ++#define SQUASHFS_NOF 3 ++#define SQUASHFS_NO_FRAG 4 ++#define SQUASHFS_ALWAYS_FRAG 5 ++#define SQUASHFS_DUPLICATE 6 ++#define SQUASHFS_EXPORT 7 ++ ++#define SQUASHFS_BIT(flag, bit) ((flag >> bit) & 1) ++ ++#define SQUASHFS_UNCOMPRESSED_INODES(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_NOI) ++ ++#define SQUASHFS_UNCOMPRESSED_DATA(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_NOD) ++ ++#define SQUASHFS_UNCOMPRESSED_FRAGMENTS(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_NOF) ++ ++#define SQUASHFS_NO_FRAGMENTS(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_NO_FRAG) ++ ++#define SQUASHFS_ALWAYS_FRAGMENTS(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_ALWAYS_FRAG) ++ ++#define SQUASHFS_DUPLICATES(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_DUPLICATE) ++ ++#define SQUASHFS_EXPORTABLE(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_EXPORT) ++ ++#define SQUASHFS_CHECK_DATA(flags) SQUASHFS_BIT(flags, \ ++ SQUASHFS_CHECK) ++ ++#define SQUASHFS_MKFLAGS(noi, nod, check_data, nof, no_frag, always_frag, \ ++ duplicate_checking, exortable) (noi | (nod << 1) | (check_data << 2) \ ++ | (nof << 3) | (no_frag << 4) | (always_frag << 5) | \ ++ (duplicate_checking << 6) | (exportable << 7)) ++ ++/* Max number of types and file types */ ++#define SQUASHFS_DIR_TYPE 1 ++#define SQUASHFS_FILE_TYPE 2 ++#define SQUASHFS_SYMLINK_TYPE 3 ++#define SQUASHFS_BLKDEV_TYPE 4 ++#define SQUASHFS_CHRDEV_TYPE 5 ++#define SQUASHFS_FIFO_TYPE 6 ++#define SQUASHFS_SOCKET_TYPE 7 ++#define SQUASHFS_LDIR_TYPE 8 ++#define SQUASHFS_LREG_TYPE 9 ++ ++/* 1.0 filesystem type definitions */ ++#define SQUASHFS_TYPES 5 ++#define SQUASHFS_IPC_TYPE 0 ++ ++/* Flag whether block is compressed or uncompressed, bit is set if block is ++ * uncompressed */ ++#define SQUASHFS_COMPRESSED_BIT (1 << 15) ++ ++#define SQUASHFS_COMPRESSED_SIZE(B) (((B) & ~SQUASHFS_COMPRESSED_BIT) ? \ ++ (B) & ~SQUASHFS_COMPRESSED_BIT : SQUASHFS_COMPRESSED_BIT) ++ ++#define SQUASHFS_COMPRESSED(B) (!((B) & SQUASHFS_COMPRESSED_BIT)) ++ ++#define SQUASHFS_COMPRESSED_BIT_BLOCK (1 << 24) ++ ++#define SQUASHFS_COMPRESSED_SIZE_BLOCK(B) (((B) & \ ++ ~SQUASHFS_COMPRESSED_BIT_BLOCK) ? (B) & \ ++ ~SQUASHFS_COMPRESSED_BIT_BLOCK : SQUASHFS_COMPRESSED_BIT_BLOCK) ++ ++#define SQUASHFS_COMPRESSED_BLOCK(B) (!((B) & SQUASHFS_COMPRESSED_BIT_BLOCK)) ++ ++/* ++ * Inode number ops. Inodes consist of a compressed block number, and an ++ * uncompressed offset within that block ++ */ ++#define SQUASHFS_INODE_BLK(a) ((unsigned int) ((a) >> 16)) ++ ++#define SQUASHFS_INODE_OFFSET(a) ((unsigned int) ((a) & 0xffff)) ++ ++#define SQUASHFS_MKINODE(A, B) ((squashfs_inode_t)(((squashfs_inode_t) (A)\ ++ << 16) + (B))) ++ ++/* Compute 32 bit VFS inode number from squashfs inode number */ ++#define SQUASHFS_MK_VFS_INODE(a, b) ((unsigned int) (((a) << 8) + \ ++ ((b) >> 2) + 1)) ++/* XXX */ ++ ++/* Translate between VFS mode and squashfs mode */ ++#define SQUASHFS_MODE(a) ((a) & 0xfff) ++ ++/* fragment and fragment table defines */ ++#define SQUASHFS_FRAGMENT_BYTES(A) ((A) * sizeof(struct squashfs_fragment_entry)) ++ ++#define SQUASHFS_FRAGMENT_INDEX(A) (SQUASHFS_FRAGMENT_BYTES(A) / \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_FRAGMENT_INDEX_OFFSET(A) (SQUASHFS_FRAGMENT_BYTES(A) % \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_FRAGMENT_INDEXES(A) ((SQUASHFS_FRAGMENT_BYTES(A) + \ ++ SQUASHFS_METADATA_SIZE - 1) / \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_FRAGMENT_INDEX_BYTES(A) (SQUASHFS_FRAGMENT_INDEXES(A) *\ ++ sizeof(long long)) ++ ++/* inode lookup table defines */ ++#define SQUASHFS_LOOKUP_BYTES(A) ((A) * sizeof(squashfs_inode_t)) ++ ++#define SQUASHFS_LOOKUP_BLOCK(A) (SQUASHFS_LOOKUP_BYTES(A) / \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_LOOKUP_BLOCK_OFFSET(A) (SQUASHFS_LOOKUP_BYTES(A) % \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_LOOKUP_BLOCKS(A) ((SQUASHFS_LOOKUP_BYTES(A) + \ ++ SQUASHFS_METADATA_SIZE - 1) / \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_LOOKUP_BLOCK_BYTES(A) (SQUASHFS_LOOKUP_BLOCKS(A) *\ ++ sizeof(long long)) ++ ++/* cached data constants for filesystem */ ++#define SQUASHFS_CACHED_BLKS 8 ++ ++#define SQUASHFS_MAX_FILE_SIZE_LOG 64 ++ ++#define SQUASHFS_MAX_FILE_SIZE ((long long) 1 << \ ++ (SQUASHFS_MAX_FILE_SIZE_LOG - 2)) ++ ++#define SQUASHFS_MARKER_BYTE 0xff ++ ++/* meta index cache */ ++#define SQUASHFS_META_INDEXES (SQUASHFS_METADATA_SIZE / sizeof(unsigned int)) ++#define SQUASHFS_META_ENTRIES 31 ++#define SQUASHFS_META_NUMBER 8 ++#define SQUASHFS_SLOTS 4 ++ ++struct meta_entry { ++ long long data_block; ++ unsigned int index_block; ++ unsigned short offset; ++ unsigned short pad; ++}; ++ ++struct meta_index { ++ unsigned int inode_number; ++ unsigned int offset; ++ unsigned short entries; ++ unsigned short skip; ++ unsigned short locked; ++ unsigned short pad; ++ struct meta_entry meta_entry[SQUASHFS_META_ENTRIES]; ++}; ++ ++ ++/* ++ * definitions for structures on disk ++ */ ++ ++typedef long long squashfs_block_t; ++typedef long long squashfs_inode_t; ++ ++struct squashfs_super_block { ++ unsigned int s_magic; ++ unsigned int inodes; ++ unsigned int bytes_used_2; ++ unsigned int uid_start_2; ++ unsigned int guid_start_2; ++ unsigned int inode_table_start_2; ++ unsigned int directory_table_start_2; ++ unsigned int s_major:16; ++ unsigned int s_minor:16; ++ unsigned int block_size_1:16; ++ unsigned int block_log:16; ++ unsigned int flags:8; ++ unsigned int no_uids:8; ++ unsigned int no_guids:8; ++ unsigned int mkfs_time /* time of filesystem creation */; ++ squashfs_inode_t root_inode; ++ unsigned int block_size; ++ unsigned int fragments; ++ unsigned int fragment_table_start_2; ++ long long bytes_used; ++ long long uid_start; ++ long long guid_start; ++ long long inode_table_start; ++ long long directory_table_start; ++ long long fragment_table_start; ++ long long lookup_table_start; ++} __attribute__ ((packed)); ++ ++struct squashfs_dir_index { ++ unsigned int index; ++ unsigned int start_block; ++ unsigned char size; ++ unsigned char name[0]; ++} __attribute__ ((packed)); ++ ++#define SQUASHFS_BASE_INODE_HEADER \ ++ unsigned int inode_type:4; \ ++ unsigned int mode:12; \ ++ unsigned int uid:8; \ ++ unsigned int guid:8; \ ++ unsigned int mtime; \ ++ unsigned int inode_number; ++ ++struct squashfs_base_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++} __attribute__ ((packed)); ++ ++struct squashfs_ipc_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++ unsigned int nlink; ++} __attribute__ ((packed)); ++ ++struct squashfs_dev_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++ unsigned int nlink; ++ unsigned short rdev; ++} __attribute__ ((packed)); ++ ++struct squashfs_symlink_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++ unsigned int nlink; ++ unsigned short symlink_size; ++ char symlink[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_reg_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++ squashfs_block_t start_block; ++ unsigned int fragment; ++ unsigned int offset; ++ unsigned int file_size; ++ unsigned short block_list[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_lreg_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++ unsigned int nlink; ++ squashfs_block_t start_block; ++ unsigned int fragment; ++ unsigned int offset; ++ long long file_size; ++ unsigned short block_list[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_dir_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++ unsigned int nlink; ++ unsigned int file_size:19; ++ unsigned int offset:13; ++ unsigned int start_block; ++ unsigned int parent_inode; ++} __attribute__ ((packed)); ++ ++struct squashfs_ldir_inode_header { ++ SQUASHFS_BASE_INODE_HEADER; ++ unsigned int nlink; ++ unsigned int file_size:27; ++ unsigned int offset:13; ++ unsigned int start_block; ++ unsigned int i_count:16; ++ unsigned int parent_inode; ++ struct squashfs_dir_index index[0]; ++} __attribute__ ((packed)); ++ ++union squashfs_inode_header { ++ struct squashfs_base_inode_header base; ++ struct squashfs_dev_inode_header dev; ++ struct squashfs_symlink_inode_header symlink; ++ struct squashfs_reg_inode_header reg; ++ struct squashfs_lreg_inode_header lreg; ++ struct squashfs_dir_inode_header dir; ++ struct squashfs_ldir_inode_header ldir; ++ struct squashfs_ipc_inode_header ipc; ++}; ++ ++struct squashfs_dir_entry { ++ unsigned int offset:13; ++ unsigned int type:3; ++ unsigned int size:8; ++ int inode_number:16; ++ char name[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_dir_header { ++ unsigned int count:8; ++ unsigned int start_block; ++ unsigned int inode_number; ++} __attribute__ ((packed)); ++ ++struct squashfs_fragment_entry { ++ long long start_block; ++ unsigned int size; ++ unsigned int pending; ++} __attribute__ ((packed)); ++ ++extern int squashfs_uncompress_block(void *d, int dstlen, void *s, int srclen); ++extern int squashfs_uncompress_init(void); ++extern int squashfs_uncompress_exit(void); ++ ++/* ++ * macros to convert each packed bitfield structure from little endian to big ++ * endian and vice versa. These are needed when creating or using a filesystem ++ * on a machine with different byte ordering to the target architecture. ++ * ++ */ ++ ++#define SQUASHFS_SWAP_START \ ++ int bits;\ ++ int b_pos;\ ++ unsigned long long val;\ ++ unsigned char *s;\ ++ unsigned char *d; ++ ++#define SQUASHFS_SWAP_SUPER_BLOCK(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_super_block));\ ++ SQUASHFS_SWAP((s)->s_magic, d, 0, 32);\ ++ SQUASHFS_SWAP((s)->inodes, d, 32, 32);\ ++ SQUASHFS_SWAP((s)->bytes_used_2, d, 64, 32);\ ++ SQUASHFS_SWAP((s)->uid_start_2, d, 96, 32);\ ++ SQUASHFS_SWAP((s)->guid_start_2, d, 128, 32);\ ++ SQUASHFS_SWAP((s)->inode_table_start_2, d, 160, 32);\ ++ SQUASHFS_SWAP((s)->directory_table_start_2, d, 192, 32);\ ++ SQUASHFS_SWAP((s)->s_major, d, 224, 16);\ ++ SQUASHFS_SWAP((s)->s_minor, d, 240, 16);\ ++ SQUASHFS_SWAP((s)->block_size_1, d, 256, 16);\ ++ SQUASHFS_SWAP((s)->block_log, d, 272, 16);\ ++ SQUASHFS_SWAP((s)->flags, d, 288, 8);\ ++ SQUASHFS_SWAP((s)->no_uids, d, 296, 8);\ ++ SQUASHFS_SWAP((s)->no_guids, d, 304, 8);\ ++ SQUASHFS_SWAP((s)->mkfs_time, d, 312, 32);\ ++ SQUASHFS_SWAP((s)->root_inode, d, 344, 64);\ ++ SQUASHFS_SWAP((s)->block_size, d, 408, 32);\ ++ SQUASHFS_SWAP((s)->fragments, d, 440, 32);\ ++ SQUASHFS_SWAP((s)->fragment_table_start_2, d, 472, 32);\ ++ SQUASHFS_SWAP((s)->bytes_used, d, 504, 64);\ ++ SQUASHFS_SWAP((s)->uid_start, d, 568, 64);\ ++ SQUASHFS_SWAP((s)->guid_start, d, 632, 64);\ ++ SQUASHFS_SWAP((s)->inode_table_start, d, 696, 64);\ ++ SQUASHFS_SWAP((s)->directory_table_start, d, 760, 64);\ ++ SQUASHFS_SWAP((s)->fragment_table_start, d, 824, 64);\ ++ SQUASHFS_SWAP((s)->lookup_table_start, d, 888, 64);\ ++} ++ ++#define SQUASHFS_SWAP_BASE_INODE_CORE(s, d, n)\ ++ SQUASHFS_MEMSET(s, d, n);\ ++ SQUASHFS_SWAP((s)->inode_type, d, 0, 4);\ ++ SQUASHFS_SWAP((s)->mode, d, 4, 12);\ ++ SQUASHFS_SWAP((s)->uid, d, 16, 8);\ ++ SQUASHFS_SWAP((s)->guid, d, 24, 8);\ ++ SQUASHFS_SWAP((s)->mtime, d, 32, 32);\ ++ SQUASHFS_SWAP((s)->inode_number, d, 64, 32); ++ ++#define SQUASHFS_SWAP_BASE_INODE_HEADER(s, d, n) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, n)\ ++} ++ ++#define SQUASHFS_SWAP_IPC_INODE_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, \ ++ sizeof(struct squashfs_ipc_inode_header))\ ++ SQUASHFS_SWAP((s)->nlink, d, 96, 32);\ ++} ++ ++#define SQUASHFS_SWAP_DEV_INODE_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, \ ++ sizeof(struct squashfs_dev_inode_header)); \ ++ SQUASHFS_SWAP((s)->nlink, d, 96, 32);\ ++ SQUASHFS_SWAP((s)->rdev, d, 128, 16);\ ++} ++ ++#define SQUASHFS_SWAP_SYMLINK_INODE_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, \ ++ sizeof(struct squashfs_symlink_inode_header));\ ++ SQUASHFS_SWAP((s)->nlink, d, 96, 32);\ ++ SQUASHFS_SWAP((s)->symlink_size, d, 128, 16);\ ++} ++ ++#define SQUASHFS_SWAP_REG_INODE_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, \ ++ sizeof(struct squashfs_reg_inode_header));\ ++ SQUASHFS_SWAP((s)->start_block, d, 96, 64);\ ++ SQUASHFS_SWAP((s)->fragment, d, 160, 32);\ ++ SQUASHFS_SWAP((s)->offset, d, 192, 32);\ ++ SQUASHFS_SWAP((s)->file_size, d, 224, 32);\ ++} ++ ++#define SQUASHFS_SWAP_LREG_INODE_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, \ ++ sizeof(struct squashfs_lreg_inode_header));\ ++ SQUASHFS_SWAP((s)->nlink, d, 96, 32);\ ++ SQUASHFS_SWAP((s)->start_block, d, 128, 64);\ ++ SQUASHFS_SWAP((s)->fragment, d, 192, 32);\ ++ SQUASHFS_SWAP((s)->offset, d, 224, 32);\ ++ SQUASHFS_SWAP((s)->file_size, d, 256, 64);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_INODE_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, \ ++ sizeof(struct squashfs_dir_inode_header));\ ++ SQUASHFS_SWAP((s)->nlink, d, 96, 32);\ ++ SQUASHFS_SWAP((s)->file_size, d, 128, 19);\ ++ SQUASHFS_SWAP((s)->offset, d, 147, 13);\ ++ SQUASHFS_SWAP((s)->start_block, d, 160, 32);\ ++ SQUASHFS_SWAP((s)->parent_inode, d, 192, 32);\ ++} ++ ++#define SQUASHFS_SWAP_LDIR_INODE_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE(s, d, \ ++ sizeof(struct squashfs_ldir_inode_header));\ ++ SQUASHFS_SWAP((s)->nlink, d, 96, 32);\ ++ SQUASHFS_SWAP((s)->file_size, d, 128, 27);\ ++ SQUASHFS_SWAP((s)->offset, d, 155, 13);\ ++ SQUASHFS_SWAP((s)->start_block, d, 168, 32);\ ++ SQUASHFS_SWAP((s)->i_count, d, 200, 16);\ ++ SQUASHFS_SWAP((s)->parent_inode, d, 216, 32);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_INDEX(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_dir_index));\ ++ SQUASHFS_SWAP((s)->index, d, 0, 32);\ ++ SQUASHFS_SWAP((s)->start_block, d, 32, 32);\ ++ SQUASHFS_SWAP((s)->size, d, 64, 8);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_HEADER(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_dir_header));\ ++ SQUASHFS_SWAP((s)->count, d, 0, 8);\ ++ SQUASHFS_SWAP((s)->start_block, d, 8, 32);\ ++ SQUASHFS_SWAP((s)->inode_number, d, 40, 32);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_ENTRY(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_dir_entry));\ ++ SQUASHFS_SWAP((s)->offset, d, 0, 13);\ ++ SQUASHFS_SWAP((s)->type, d, 13, 3);\ ++ SQUASHFS_SWAP((s)->size, d, 16, 8);\ ++ SQUASHFS_SWAP((s)->inode_number, d, 24, 16);\ ++} ++ ++#define SQUASHFS_SWAP_FRAGMENT_ENTRY(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_fragment_entry));\ ++ SQUASHFS_SWAP((s)->start_block, d, 0, 64);\ ++ SQUASHFS_SWAP((s)->size, d, 64, 32);\ ++} ++ ++#define SQUASHFS_SWAP_INODE_T(s, d) SQUASHFS_SWAP_LONG_LONGS(s, d, 1) ++ ++#define SQUASHFS_SWAP_SHORTS(s, d, n) {\ ++ int entry;\ ++ int bit_position;\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, n * 2);\ ++ for(entry = 0, bit_position = 0; entry < n; entry++, bit_position += \ ++ 16)\ ++ SQUASHFS_SWAP(s[entry], d, bit_position, 16);\ ++} ++ ++#define SQUASHFS_SWAP_INTS(s, d, n) {\ ++ int entry;\ ++ int bit_position;\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, n * 4);\ ++ for(entry = 0, bit_position = 0; entry < n; entry++, bit_position += \ ++ 32)\ ++ SQUASHFS_SWAP(s[entry], d, bit_position, 32);\ ++} ++ ++#define SQUASHFS_SWAP_LONG_LONGS(s, d, n) {\ ++ int entry;\ ++ int bit_position;\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, n * 8);\ ++ for(entry = 0, bit_position = 0; entry < n; entry++, bit_position += \ ++ 64)\ ++ SQUASHFS_SWAP(s[entry], d, bit_position, 64);\ ++} ++ ++#define SQUASHFS_SWAP_DATA(s, d, n, bits) {\ ++ int entry;\ ++ int bit_position;\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, n * bits / 8);\ ++ for(entry = 0, bit_position = 0; entry < n; entry++, bit_position += \ ++ bits)\ ++ SQUASHFS_SWAP(s[entry], d, bit_position, bits);\ ++} ++ ++#define SQUASHFS_SWAP_FRAGMENT_INDEXES(s, d, n) SQUASHFS_SWAP_LONG_LONGS(s, d, n) ++#define SQUASHFS_SWAP_LOOKUP_BLOCKS(s, d, n) SQUASHFS_SWAP_LONG_LONGS(s, d, n) ++ ++#ifdef CONFIG_SQUASHFS_1_0_COMPATIBILITY ++ ++struct squashfs_base_inode_header_1 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:4; /* index into uid table */ ++ unsigned int guid:4; /* index into guid table */ ++} __attribute__ ((packed)); ++ ++struct squashfs_ipc_inode_header_1 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:4; /* index into uid table */ ++ unsigned int guid:4; /* index into guid table */ ++ unsigned int type:4; ++ unsigned int offset:4; ++} __attribute__ ((packed)); ++ ++struct squashfs_dev_inode_header_1 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:4; /* index into uid table */ ++ unsigned int guid:4; /* index into guid table */ ++ unsigned short rdev; ++} __attribute__ ((packed)); ++ ++struct squashfs_symlink_inode_header_1 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:4; /* index into uid table */ ++ unsigned int guid:4; /* index into guid table */ ++ unsigned short symlink_size; ++ char symlink[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_reg_inode_header_1 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:4; /* index into uid table */ ++ unsigned int guid:4; /* index into guid table */ ++ unsigned int mtime; ++ unsigned int start_block; ++ unsigned int file_size:32; ++ unsigned short block_list[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_dir_inode_header_1 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:4; /* index into uid table */ ++ unsigned int guid:4; /* index into guid table */ ++ unsigned int file_size:19; ++ unsigned int offset:13; ++ unsigned int mtime; ++ unsigned int start_block:24; ++} __attribute__ ((packed)); ++ ++#define SQUASHFS_SWAP_BASE_INODE_CORE_1(s, d, n) \ ++ SQUASHFS_MEMSET(s, d, n);\ ++ SQUASHFS_SWAP((s)->inode_type, d, 0, 4);\ ++ SQUASHFS_SWAP((s)->mode, d, 4, 12);\ ++ SQUASHFS_SWAP((s)->uid, d, 16, 4);\ ++ SQUASHFS_SWAP((s)->guid, d, 20, 4); ++ ++#define SQUASHFS_SWAP_BASE_INODE_HEADER_1(s, d, n) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_1(s, d, n)\ ++} ++ ++#define SQUASHFS_SWAP_IPC_INODE_HEADER_1(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_1(s, d, \ ++ sizeof(struct squashfs_ipc_inode_header_1));\ ++ SQUASHFS_SWAP((s)->type, d, 24, 4);\ ++ SQUASHFS_SWAP((s)->offset, d, 28, 4);\ ++} ++ ++#define SQUASHFS_SWAP_DEV_INODE_HEADER_1(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_1(s, d, \ ++ sizeof(struct squashfs_dev_inode_header_1));\ ++ SQUASHFS_SWAP((s)->rdev, d, 24, 16);\ ++} ++ ++#define SQUASHFS_SWAP_SYMLINK_INODE_HEADER_1(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_1(s, d, \ ++ sizeof(struct squashfs_symlink_inode_header_1));\ ++ SQUASHFS_SWAP((s)->symlink_size, d, 24, 16);\ ++} ++ ++#define SQUASHFS_SWAP_REG_INODE_HEADER_1(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_1(s, d, \ ++ sizeof(struct squashfs_reg_inode_header_1));\ ++ SQUASHFS_SWAP((s)->mtime, d, 24, 32);\ ++ SQUASHFS_SWAP((s)->start_block, d, 56, 32);\ ++ SQUASHFS_SWAP((s)->file_size, d, 88, 32);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_INODE_HEADER_1(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_1(s, d, \ ++ sizeof(struct squashfs_dir_inode_header_1));\ ++ SQUASHFS_SWAP((s)->file_size, d, 24, 19);\ ++ SQUASHFS_SWAP((s)->offset, d, 43, 13);\ ++ SQUASHFS_SWAP((s)->mtime, d, 56, 32);\ ++ SQUASHFS_SWAP((s)->start_block, d, 88, 24);\ ++} ++ ++#endif ++ ++#ifdef CONFIG_SQUASHFS_2_0_COMPATIBILITY ++ ++struct squashfs_dir_index_2 { ++ unsigned int index:27; ++ unsigned int start_block:29; ++ unsigned char size; ++ unsigned char name[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_base_inode_header_2 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:8; /* index into uid table */ ++ unsigned int guid:8; /* index into guid table */ ++} __attribute__ ((packed)); ++ ++struct squashfs_ipc_inode_header_2 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:8; /* index into uid table */ ++ unsigned int guid:8; /* index into guid table */ ++} __attribute__ ((packed)); ++ ++struct squashfs_dev_inode_header_2 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:8; /* index into uid table */ ++ unsigned int guid:8; /* index into guid table */ ++ unsigned short rdev; ++} __attribute__ ((packed)); ++ ++struct squashfs_symlink_inode_header_2 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:8; /* index into uid table */ ++ unsigned int guid:8; /* index into guid table */ ++ unsigned short symlink_size; ++ char symlink[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_reg_inode_header_2 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:8; /* index into uid table */ ++ unsigned int guid:8; /* index into guid table */ ++ unsigned int mtime; ++ unsigned int start_block; ++ unsigned int fragment; ++ unsigned int offset; ++ unsigned int file_size:32; ++ unsigned short block_list[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_dir_inode_header_2 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:8; /* index into uid table */ ++ unsigned int guid:8; /* index into guid table */ ++ unsigned int file_size:19; ++ unsigned int offset:13; ++ unsigned int mtime; ++ unsigned int start_block:24; ++} __attribute__ ((packed)); ++ ++struct squashfs_ldir_inode_header_2 { ++ unsigned int inode_type:4; ++ unsigned int mode:12; /* protection */ ++ unsigned int uid:8; /* index into uid table */ ++ unsigned int guid:8; /* index into guid table */ ++ unsigned int file_size:27; ++ unsigned int offset:13; ++ unsigned int mtime; ++ unsigned int start_block:24; ++ unsigned int i_count:16; ++ struct squashfs_dir_index_2 index[0]; ++} __attribute__ ((packed)); ++ ++union squashfs_inode_header_2 { ++ struct squashfs_base_inode_header_2 base; ++ struct squashfs_dev_inode_header_2 dev; ++ struct squashfs_symlink_inode_header_2 symlink; ++ struct squashfs_reg_inode_header_2 reg; ++ struct squashfs_dir_inode_header_2 dir; ++ struct squashfs_ldir_inode_header_2 ldir; ++ struct squashfs_ipc_inode_header_2 ipc; ++}; ++ ++struct squashfs_dir_header_2 { ++ unsigned int count:8; ++ unsigned int start_block:24; ++} __attribute__ ((packed)); ++ ++struct squashfs_dir_entry_2 { ++ unsigned int offset:13; ++ unsigned int type:3; ++ unsigned int size:8; ++ char name[0]; ++} __attribute__ ((packed)); ++ ++struct squashfs_fragment_entry_2 { ++ unsigned int start_block; ++ unsigned int size; ++} __attribute__ ((packed)); ++ ++#define SQUASHFS_SWAP_BASE_INODE_CORE_2(s, d, n)\ ++ SQUASHFS_MEMSET(s, d, n);\ ++ SQUASHFS_SWAP((s)->inode_type, d, 0, 4);\ ++ SQUASHFS_SWAP((s)->mode, d, 4, 12);\ ++ SQUASHFS_SWAP((s)->uid, d, 16, 8);\ ++ SQUASHFS_SWAP((s)->guid, d, 24, 8);\ ++ ++#define SQUASHFS_SWAP_BASE_INODE_HEADER_2(s, d, n) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_2(s, d, n)\ ++} ++ ++#define SQUASHFS_SWAP_IPC_INODE_HEADER_2(s, d) \ ++ SQUASHFS_SWAP_BASE_INODE_HEADER_2(s, d, sizeof(struct squashfs_ipc_inode_header_2)) ++ ++#define SQUASHFS_SWAP_DEV_INODE_HEADER_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_2(s, d, \ ++ sizeof(struct squashfs_dev_inode_header_2)); \ ++ SQUASHFS_SWAP((s)->rdev, d, 32, 16);\ ++} ++ ++#define SQUASHFS_SWAP_SYMLINK_INODE_HEADER_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_2(s, d, \ ++ sizeof(struct squashfs_symlink_inode_header_2));\ ++ SQUASHFS_SWAP((s)->symlink_size, d, 32, 16);\ ++} ++ ++#define SQUASHFS_SWAP_REG_INODE_HEADER_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_2(s, d, \ ++ sizeof(struct squashfs_reg_inode_header_2));\ ++ SQUASHFS_SWAP((s)->mtime, d, 32, 32);\ ++ SQUASHFS_SWAP((s)->start_block, d, 64, 32);\ ++ SQUASHFS_SWAP((s)->fragment, d, 96, 32);\ ++ SQUASHFS_SWAP((s)->offset, d, 128, 32);\ ++ SQUASHFS_SWAP((s)->file_size, d, 160, 32);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_INODE_HEADER_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_2(s, d, \ ++ sizeof(struct squashfs_dir_inode_header_2));\ ++ SQUASHFS_SWAP((s)->file_size, d, 32, 19);\ ++ SQUASHFS_SWAP((s)->offset, d, 51, 13);\ ++ SQUASHFS_SWAP((s)->mtime, d, 64, 32);\ ++ SQUASHFS_SWAP((s)->start_block, d, 96, 24);\ ++} ++ ++#define SQUASHFS_SWAP_LDIR_INODE_HEADER_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_SWAP_BASE_INODE_CORE_2(s, d, \ ++ sizeof(struct squashfs_ldir_inode_header_2));\ ++ SQUASHFS_SWAP((s)->file_size, d, 32, 27);\ ++ SQUASHFS_SWAP((s)->offset, d, 59, 13);\ ++ SQUASHFS_SWAP((s)->mtime, d, 72, 32);\ ++ SQUASHFS_SWAP((s)->start_block, d, 104, 24);\ ++ SQUASHFS_SWAP((s)->i_count, d, 128, 16);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_INDEX_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_dir_index_2));\ ++ SQUASHFS_SWAP((s)->index, d, 0, 27);\ ++ SQUASHFS_SWAP((s)->start_block, d, 27, 29);\ ++ SQUASHFS_SWAP((s)->size, d, 56, 8);\ ++} ++#define SQUASHFS_SWAP_DIR_HEADER_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_dir_header_2));\ ++ SQUASHFS_SWAP((s)->count, d, 0, 8);\ ++ SQUASHFS_SWAP((s)->start_block, d, 8, 24);\ ++} ++ ++#define SQUASHFS_SWAP_DIR_ENTRY_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_dir_entry_2));\ ++ SQUASHFS_SWAP((s)->offset, d, 0, 13);\ ++ SQUASHFS_SWAP((s)->type, d, 13, 3);\ ++ SQUASHFS_SWAP((s)->size, d, 16, 8);\ ++} ++ ++#define SQUASHFS_SWAP_FRAGMENT_ENTRY_2(s, d) {\ ++ SQUASHFS_SWAP_START\ ++ SQUASHFS_MEMSET(s, d, sizeof(struct squashfs_fragment_entry_2));\ ++ SQUASHFS_SWAP((s)->start_block, d, 0, 32);\ ++ SQUASHFS_SWAP((s)->size, d, 32, 32);\ ++} ++ ++#define SQUASHFS_SWAP_FRAGMENT_INDEXES_2(s, d, n) SQUASHFS_SWAP_INTS(s, d, n) ++ ++/* fragment and fragment table defines */ ++#define SQUASHFS_FRAGMENT_BYTES_2(A) (A * sizeof(struct squashfs_fragment_entry_2)) ++ ++#define SQUASHFS_FRAGMENT_INDEX_2(A) (SQUASHFS_FRAGMENT_BYTES_2(A) / \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_FRAGMENT_INDEX_OFFSET_2(A) (SQUASHFS_FRAGMENT_BYTES_2(A) % \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_FRAGMENT_INDEXES_2(A) ((SQUASHFS_FRAGMENT_BYTES_2(A) + \ ++ SQUASHFS_METADATA_SIZE - 1) / \ ++ SQUASHFS_METADATA_SIZE) ++ ++#define SQUASHFS_FRAGMENT_INDEX_BYTES_2(A) (SQUASHFS_FRAGMENT_INDEXES_2(A) *\ ++ sizeof(int)) ++ ++#endif ++ ++#ifdef __KERNEL__ ++ ++/* ++ * macros used to swap each structure entry, taking into account ++ * bitfields and different bitfield placing conventions on differing ++ * architectures ++ */ ++ ++#include <asm/byteorder.h> ++ ++#ifdef __BIG_ENDIAN ++ /* convert from little endian to big endian */ ++#define SQUASHFS_SWAP(value, p, pos, tbits) _SQUASHFS_SWAP(value, p, pos, \ ++ tbits, b_pos) ++#else ++ /* convert from big endian to little endian */ ++#define SQUASHFS_SWAP(value, p, pos, tbits) _SQUASHFS_SWAP(value, p, pos, \ ++ tbits, 64 - tbits - b_pos) ++#endif ++ ++#define _SQUASHFS_SWAP(value, p, pos, tbits, SHIFT) {\ ++ b_pos = pos % 8;\ ++ val = 0;\ ++ s = (unsigned char *)p + (pos / 8);\ ++ d = ((unsigned char *) &val) + 7;\ ++ for(bits = 0; bits < (tbits + b_pos); bits += 8) \ ++ *d-- = *s++;\ ++ value = (val >> (SHIFT))/* & ((1 << tbits) - 1)*/;\ ++} ++ ++#define SQUASHFS_MEMSET(s, d, n) memset(s, 0, n); ++ ++#endif ++#endif +diff --git a/include/linux/squashfs_fs_i.h b/include/linux/squashfs_fs_i.h +new file mode 100644 +index 0000000..798891a +--- /dev/null ++++ b/include/linux/squashfs_fs_i.h +@@ -0,0 +1,45 @@ ++#ifndef SQUASHFS_FS_I ++#define SQUASHFS_FS_I ++/* ++ * Squashfs ++ * ++ * Copyright (c) 2002, 2003, 2004, 2005, 2006, 2007 ++ * Phillip Lougher <phillip@lougher.org.uk> ++ * ++ * This program is free software; you can redistribute it and/or ++ * modify it under the terms of the GNU General Public License ++ * as published by the Free Software Foundation; either version 2, ++ * or (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ++ * ++ * squashfs_fs_i.h ++ */ ++ ++struct squashfs_inode_info { ++ long long start_block; ++ unsigned int offset; ++ union { ++ struct { ++ long long fragment_start_block; ++ unsigned int fragment_size; ++ unsigned int fragment_offset; ++ long long block_list_start; ++ } s1; ++ struct { ++ long long directory_index_start; ++ unsigned int directory_index_offset; ++ unsigned int directory_index_count; ++ unsigned int parent_inode; ++ } s2; ++ } u; ++ struct inode vfs_inode; ++}; ++#endif +diff --git a/include/linux/squashfs_fs_sb.h b/include/linux/squashfs_fs_sb.h +new file mode 100644 +index 0000000..8f3bf99 +--- /dev/null ++++ b/include/linux/squashfs_fs_sb.h +@@ -0,0 +1,74 @@ ++#ifndef SQUASHFS_FS_SB ++#define SQUASHFS_FS_SB ++/* ++ * Squashfs ++ * ++ * Copyright (c) 2002, 2003, 2004, 2005, 2006, 2007 ++ * Phillip Lougher <phillip@lougher.org.uk> ++ * ++ * This program is free software; you can redistribute it and/or ++ * modify it under the terms of the GNU General Public License ++ * as published by the Free Software Foundation; either version 2, ++ * or (at your option) any later version. ++ * ++ * This program is distributed in the hope that it will be useful, ++ * but WITHOUT ANY WARRANTY; without even the implied warranty of ++ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ++ * GNU General Public License for more details. ++ * ++ * You should have received a copy of the GNU General Public License ++ * along with this program; if not, write to the Free Software ++ * Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. ++ * ++ * squashfs_fs_sb.h ++ */ ++ ++#include <linux/squashfs_fs.h> ++ ++struct squashfs_cache { ++ long long block; ++ int length; ++ long long next_index; ++ char *data; ++}; ++ ++struct squashfs_fragment_cache { ++ long long block; ++ int length; ++ unsigned int locked; ++ char *data; ++}; ++ ++struct squashfs_sb_info { ++ struct squashfs_super_block sblk; ++ int devblksize; ++ int devblksize_log2; ++ int swap; ++ struct squashfs_cache *block_cache; ++ struct squashfs_fragment_cache *fragment; ++ int next_cache; ++ int next_fragment; ++ int next_meta_index; ++ unsigned int *uid; ++ unsigned int *guid; ++ long long *fragment_index; ++ unsigned int *fragment_index_2; ++ char *read_page; ++ struct mutex read_data_mutex; ++ struct mutex read_page_mutex; ++ struct mutex block_cache_mutex; ++ struct mutex fragment_mutex; ++ struct mutex meta_index_mutex; ++ wait_queue_head_t waitq; ++ wait_queue_head_t fragment_wait_queue; ++ struct meta_index *meta_index; ++ z_stream stream; ++ long long *inode_lookup_table; ++ int (*read_inode)(struct inode *i, squashfs_inode_t \ ++ inode); ++ long long (*read_blocklist)(struct inode *inode, int \ ++ index, int readahead_blks, char *block_list, \ ++ unsigned short **block_p, unsigned int *bsize); ++ int (*read_fragment_index_table)(struct super_block *s); ++}; ++#endif +diff --git a/init/Kconfig b/init/Kconfig +index b170aa1..bcfc3b4 100644 +--- a/init/Kconfig ++++ b/init/Kconfig +@@ -244,23 +244,21 @@ config AUDITSYSCALL + ensure that INOTIFY is configured. + + config IKCONFIG +- tristate "Kernel .config support" ++ tristate "Kernel .miniconfig support" + ---help--- +- This option enables the complete Linux kernel ".config" file ++ This option enables the mini Linux kernel ".miniconfig" file + contents to be saved in the kernel. It provides documentation + of which kernel options are used in a running kernel or in an +- on-disk kernel. This information can be extracted from the kernel +- image file with the script scripts/extract-ikconfig and used as +- input to rebuild the current kernel or to build another kernel. +- It can also be extracted from a running kernel by reading +- /proc/config.gz if enabled (below). ++ on-disk kernel. ++ It can be extracted from a running kernel by reading ++ /proc/miniconfig.gz if enabled (below). + + config IKCONFIG_PROC +- bool "Enable access to .config through /proc/config.gz" ++ bool "Enable access to .miniconfig through /proc/miniconfig.gz" + depends on IKCONFIG && PROC_FS + ---help--- + This option enables access to the kernel configuration file +- through /proc/config.gz. ++ through /proc/miniconfig.gz. + + config CPUSETS + bool "Cpuset support" +diff --git a/init/LzmaDecode.c b/init/LzmaDecode.c +new file mode 100644 +index 0000000..21bf40b +--- /dev/null ++++ b/init/LzmaDecode.c +@@ -0,0 +1,588 @@ ++/* ++ LzmaDecode.c ++ LZMA Decoder (optimized for Speed version) ++ ++ LZMA SDK 4.22 Copyright (c) 1999-2005 Igor Pavlov (2005-06-10) ++ http://www.7-zip.org/ ++ ++ LZMA SDK is licensed under two licenses: ++ 1) GNU Lesser General Public License (GNU LGPL) ++ 2) Common Public License (CPL) ++ It means that you can select one of these two licenses and ++ follow rules of that license. ++ ++ SPECIAL EXCEPTION: ++ Igor Pavlov, as the author of this Code, expressly permits you to ++ statically or dynamically link your Code (or bind by name) to the ++ interfaces of this file without subjecting your linked Code to the ++ terms of the CPL or GNU LGPL. Any modifications or additions ++ to this file, however, are subject to the LGPL or CPL terms. ++*/ ++ ++#include "LzmaDecode.h" ++ ++#ifndef Byte ++#define Byte unsigned char ++#endif ++ ++#define kNumTopBits 24 ++#define kTopValue ((UInt32)1 << kNumTopBits) ++ ++#define kNumBitModelTotalBits 11 ++#define kBitModelTotal (1 << kNumBitModelTotalBits) ++#define kNumMoveBits 5 ++ ++#define RC_READ_BYTE (*Buffer++) ++ ++#define RC_INIT2 Code = 0; Range = 0xFFFFFFFF; \ ++ { int i; for(i = 0; i < 5; i++) { RC_TEST; Code = (Code << 8) | RC_READ_BYTE; }} ++ ++#ifdef _LZMA_IN_CB ++ ++#define RC_TEST { if (Buffer == BufferLim) \ ++ { SizeT size; int result = InCallback->Read(InCallback, &Buffer, &size); if (result != LZMA_RESULT_OK) return result; \ ++ BufferLim = Buffer + size; if (size == 0) return LZMA_RESULT_DATA_ERROR; }} ++ ++#define RC_INIT Buffer = BufferLim = 0; RC_INIT2 ++ ++#else ++ ++#define RC_TEST { if (Buffer == BufferLim) return LZMA_RESULT_DATA_ERROR; } ++ ++#define RC_INIT(buffer, bufferSize) Buffer = buffer; BufferLim = buffer + bufferSize; RC_INIT2 ++ ++#endif ++ ++#define RC_NORMALIZE if (Range < kTopValue) { RC_TEST; Range <<= 8; Code = (Code << 8) | RC_READ_BYTE; } ++ ++#define IfBit0(p) RC_NORMALIZE; bound = (Range >> kNumBitModelTotalBits) * *(p); if (Code < bound) ++#define UpdateBit0(p) Range = bound; *(p) += (kBitModelTotal - *(p)) >> kNumMoveBits; ++#define UpdateBit1(p) Range -= bound; Code -= bound; *(p) -= (*(p)) >> kNumMoveBits; ++ ++#define RC_GET_BIT2(p, mi, A0, A1) IfBit0(p) \ ++ { UpdateBit0(p); mi <<= 1; A0; } else \ ++ { UpdateBit1(p); mi = (mi + mi) + 1; A1; } ++ ++#define RC_GET_BIT(p, mi) RC_GET_BIT2(p, mi, ; , ;) ++ ++#define RangeDecoderBitTreeDecode(probs, numLevels, res) \ ++ { int i = numLevels; res = 1; \ ++ do { CProb *p = probs + res; RC_GET_BIT(p, res) } while(--i != 0); \ ++ res -= (1 << numLevels); } ++ ++ ++#define kNumPosBitsMax 4 ++#define kNumPosStatesMax (1 << kNumPosBitsMax) ++ ++#define kLenNumLowBits 3 ++#define kLenNumLowSymbols (1 << kLenNumLowBits) ++#define kLenNumMidBits 3 ++#define kLenNumMidSymbols (1 << kLenNumMidBits) ++#define kLenNumHighBits 8 ++#define kLenNumHighSymbols (1 << kLenNumHighBits) ++ ++#define LenChoice 0 ++#define LenChoice2 (LenChoice + 1) ++#define LenLow (LenChoice2 + 1) ++#define LenMid (LenLow + (kNumPosStatesMax << kLenNumLowBits)) ++#define LenHigh (LenMid + (kNumPosStatesMax << kLenNumMidBits)) ++#define kNumLenProbs (LenHigh + kLenNumHighSymbols) ++ ++ ++#define kNumStates 12 ++#define kNumLitStates 7 ++ ++#define kStartPosModelIndex 4 ++#define kEndPosModelIndex 14 ++#define kNumFullDistances (1 << (kEndPosModelIndex >> 1)) ++ ++#define kNumPosSlotBits 6 ++#define kNumLenToPosStates 4 ++ ++#define kNumAlignBits 4 ++#define kAlignTableSize (1 << kNumAlignBits) ++ ++#define kMatchMinLen 2 ++ ++#define IsMatch 0 ++#define IsRep (IsMatch + (kNumStates << kNumPosBitsMax)) ++#define IsRepG0 (IsRep + kNumStates) ++#define IsRepG1 (IsRepG0 + kNumStates) ++#define IsRepG2 (IsRepG1 + kNumStates) ++#define IsRep0Long (IsRepG2 + kNumStates) ++#define PosSlot (IsRep0Long + (kNumStates << kNumPosBitsMax)) ++#define SpecPos (PosSlot + (kNumLenToPosStates << kNumPosSlotBits)) ++#define Align (SpecPos + kNumFullDistances - kEndPosModelIndex) ++#define LenCoder (Align + kAlignTableSize) ++#define RepLenCoder (LenCoder + kNumLenProbs) ++#define Literal (RepLenCoder + kNumLenProbs) ++ ++#if Literal != LZMA_BASE_SIZE ++StopCompilingDueBUG ++#endif ++ ++int LzmaDecodeProperties(CLzmaProperties *propsRes, const unsigned char *propsData, int size) ++{ ++ unsigned char prop0; ++ if (size < LZMA_PROPERTIES_SIZE) ++ return LZMA_RESULT_DATA_ERROR; ++ prop0 = propsData[0]; ++ if (prop0 >= (9 * 5 * 5)) ++ return LZMA_RESULT_DATA_ERROR; ++ { ++ for (propsRes->pb = 0; prop0 >= (9 * 5); propsRes->pb++, prop0 -= (9 * 5)); ++ for (propsRes->lp = 0; prop0 >= 9; propsRes->lp++, prop0 -= 9); ++ propsRes->lc = prop0; ++ /* ++ unsigned char remainder = (unsigned char)(prop0 / 9); ++ propsRes->lc = prop0 % 9; ++ propsRes->pb = remainder / 5; ++ propsRes->lp = remainder % 5; ++ */ ++ } ++ ++ #ifdef _LZMA_OUT_READ ++ { ++ int i; ++ propsRes->DictionarySize = 0; ++ for (i = 0; i < 4; i++) ++ propsRes->DictionarySize += (UInt32)(propsData[1 + i]) << (i * 8); ++ if (propsRes->DictionarySize == 0) ++ propsRes->DictionarySize = 1; ++ } ++ #endif ++ return LZMA_RESULT_OK; ++} ++ ++#define kLzmaStreamWasFinishedId (-1) ++ ++int LzmaDecode(CLzmaDecoderState *vs, ++ #ifdef _LZMA_IN_CB ++ ILzmaInCallback *InCallback, ++ #else ++ const unsigned char *inStream, SizeT inSize, SizeT *inSizeProcessed, ++ #endif ++ unsigned char *outStream, SizeT outSize, SizeT *outSizeProcessed) ++{ ++ CProb *p = vs->Probs; ++ SizeT nowPos = 0; ++ Byte previousByte = 0; ++ UInt32 posStateMask = (1 << (vs->Properties.pb)) - 1; ++ UInt32 literalPosMask = (1 << (vs->Properties.lp)) - 1; ++ int lc = vs->Properties.lc; ++ ++ #ifdef _LZMA_OUT_READ ++ ++ UInt32 Range = vs->Range; ++ UInt32 Code = vs->Code; ++ #ifdef _LZMA_IN_CB ++ const Byte *Buffer = vs->Buffer; ++ const Byte *BufferLim = vs->BufferLim; ++ #else ++ const Byte *Buffer = inStream; ++ const Byte *BufferLim = inStream + inSize; ++ #endif ++ int state = vs->State; ++ UInt32 rep0 = vs->Reps[0], rep1 = vs->Reps[1], rep2 = vs->Reps[2], rep3 = vs->Reps[3]; ++ int len = vs->RemainLen; ++ UInt32 globalPos = vs->GlobalPos; ++ UInt32 distanceLimit = vs->DistanceLimit; ++ ++ Byte *dictionary = vs->Dictionary; ++ UInt32 dictionarySize = vs->Properties.DictionarySize; ++ UInt32 dictionaryPos = vs->DictionaryPos; ++ ++ Byte tempDictionary[4]; ++ ++ #ifndef _LZMA_IN_CB ++ *inSizeProcessed = 0; ++ #endif ++ *outSizeProcessed = 0; ++ if (len == kLzmaStreamWasFinishedId) ++ return LZMA_RESULT_OK; ++ ++ if (dictionarySize == 0) ++ { ++ dictionary = tempDictionary; ++ dictionarySize = 1; ++ tempDictionary[0] = vs->TempDictionary[0]; ++ } ++ ++ if (len == kLzmaNeedInitId) ++ { ++ { ++ UInt32 numProbs = Literal + ((UInt32)LZMA_LIT_SIZE << (lc + vs->Properties.lp)); ++ UInt32 i; ++ for (i = 0; i < numProbs; i++) ++ p[i] = kBitModelTotal >> 1; ++ rep0 = rep1 = rep2 = rep3 = 1; ++ state = 0; ++ globalPos = 0; ++ distanceLimit = 0; ++ dictionaryPos = 0; ++ dictionary[dictionarySize - 1] = 0; ++ #ifdef _LZMA_IN_CB ++ RC_INIT; ++ #else ++ RC_INIT(inStream, inSize); ++ #endif ++ } ++ len = 0; ++ } ++ while(len != 0 && nowPos < outSize) ++ { ++ UInt32 pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ outStream[nowPos++] = dictionary[dictionaryPos] = dictionary[pos]; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ len--; ++ } ++ if (dictionaryPos == 0) ++ previousByte = dictionary[dictionarySize - 1]; ++ else ++ previousByte = dictionary[dictionaryPos - 1]; ++ ++ #else /* if !_LZMA_OUT_READ */ ++ ++ int state = 0; ++ UInt32 rep0 = 1, rep1 = 1, rep2 = 1, rep3 = 1; ++ int len = 0; ++ const Byte *Buffer; ++ const Byte *BufferLim; ++ UInt32 Range; ++ UInt32 Code; ++ ++ #ifndef _LZMA_IN_CB ++ *inSizeProcessed = 0; ++ #endif ++ *outSizeProcessed = 0; ++ ++ { ++ UInt32 i; ++ UInt32 numProbs = Literal + ((UInt32)LZMA_LIT_SIZE << (lc + vs->Properties.lp)); ++ for (i = 0; i < numProbs; i++) ++ p[i] = kBitModelTotal >> 1; ++ } ++ ++ #ifdef _LZMA_IN_CB ++ RC_INIT; ++ #else ++ RC_INIT(inStream, inSize); ++ #endif ++ ++ #endif /* _LZMA_OUT_READ */ ++ ++ while(nowPos < outSize) ++ { ++ CProb *prob; ++ UInt32 bound; ++ int posState = (int)( ++ (nowPos ++ #ifdef _LZMA_OUT_READ ++ + globalPos ++ #endif ++ ) ++ & posStateMask); ++ ++ prob = p + IsMatch + (state << kNumPosBitsMax) + posState; ++ IfBit0(prob) ++ { ++ int symbol = 1; ++ UpdateBit0(prob) ++ prob = p + Literal + (LZMA_LIT_SIZE * ++ ((( ++ (nowPos ++ #ifdef _LZMA_OUT_READ ++ + globalPos ++ #endif ++ ) ++ & literalPosMask) << lc) + (previousByte >> (8 - lc)))); ++ ++ if (state >= kNumLitStates) ++ { ++ int matchByte; ++ #ifdef _LZMA_OUT_READ ++ UInt32 pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ matchByte = dictionary[pos]; ++ #else ++ matchByte = outStream[nowPos - rep0]; ++ #endif ++ do ++ { ++ int bit; ++ CProb *probLit; ++ matchByte <<= 1; ++ bit = (matchByte & 0x100); ++ probLit = prob + 0x100 + bit + symbol; ++ RC_GET_BIT2(probLit, symbol, if (bit != 0) break, if (bit == 0) break) ++ } ++ while (symbol < 0x100); ++ } ++ while (symbol < 0x100) ++ { ++ CProb *probLit = prob + symbol; ++ RC_GET_BIT(probLit, symbol) ++ } ++ previousByte = (Byte)symbol; ++ ++ outStream[nowPos++] = previousByte; ++ #ifdef _LZMA_OUT_READ ++ if (distanceLimit < dictionarySize) ++ distanceLimit++; ++ ++ dictionary[dictionaryPos] = previousByte; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ #endif ++ if (state < 4) state = 0; ++ else if (state < 10) state -= 3; ++ else state -= 6; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ prob = p + IsRep + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ rep3 = rep2; ++ rep2 = rep1; ++ rep1 = rep0; ++ state = state < kNumLitStates ? 0 : 3; ++ prob = p + LenCoder; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ prob = p + IsRepG0 + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ prob = p + IsRep0Long + (state << kNumPosBitsMax) + posState; ++ IfBit0(prob) ++ { ++ #ifdef _LZMA_OUT_READ ++ UInt32 pos; ++ #endif ++ UpdateBit0(prob); ++ ++ #ifdef _LZMA_OUT_READ ++ if (distanceLimit == 0) ++ #else ++ if (nowPos == 0) ++ #endif ++ return LZMA_RESULT_DATA_ERROR; ++ ++ state = state < kNumLitStates ? 9 : 11; ++ #ifdef _LZMA_OUT_READ ++ pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ previousByte = dictionary[pos]; ++ dictionary[dictionaryPos] = previousByte; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ #else ++ previousByte = outStream[nowPos - rep0]; ++ #endif ++ outStream[nowPos++] = previousByte; ++ #ifdef _LZMA_OUT_READ ++ if (distanceLimit < dictionarySize) ++ distanceLimit++; ++ #endif ++ ++ continue; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ } ++ } ++ else ++ { ++ UInt32 distance; ++ UpdateBit1(prob); ++ prob = p + IsRepG1 + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ distance = rep1; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ prob = p + IsRepG2 + state; ++ IfBit0(prob) ++ { ++ UpdateBit0(prob); ++ distance = rep2; ++ } ++ else ++ { ++ UpdateBit1(prob); ++ distance = rep3; ++ rep3 = rep2; ++ } ++ rep2 = rep1; ++ } ++ rep1 = rep0; ++ rep0 = distance; ++ } ++ state = state < kNumLitStates ? 8 : 11; ++ prob = p + RepLenCoder; ++ } ++ { ++ int numBits, offset; ++ CProb *probLen = prob + LenChoice; ++ IfBit0(probLen) ++ { ++ UpdateBit0(probLen); ++ probLen = prob + LenLow + (posState << kLenNumLowBits); ++ offset = 0; ++ numBits = kLenNumLowBits; ++ } ++ else ++ { ++ UpdateBit1(probLen); ++ probLen = prob + LenChoice2; ++ IfBit0(probLen) ++ { ++ UpdateBit0(probLen); ++ probLen = prob + LenMid + (posState << kLenNumMidBits); ++ offset = kLenNumLowSymbols; ++ numBits = kLenNumMidBits; ++ } ++ else ++ { ++ UpdateBit1(probLen); ++ probLen = prob + LenHigh; ++ offset = kLenNumLowSymbols + kLenNumMidSymbols; ++ numBits = kLenNumHighBits; ++ } ++ } ++ RangeDecoderBitTreeDecode(probLen, numBits, len); ++ len += offset; ++ } ++ ++ if (state < 4) ++ { ++ int posSlot; ++ state += kNumLitStates; ++ prob = p + PosSlot + ++ ((len < kNumLenToPosStates ? len : kNumLenToPosStates - 1) << ++ kNumPosSlotBits); ++ RangeDecoderBitTreeDecode(prob, kNumPosSlotBits, posSlot); ++ if (posSlot >= kStartPosModelIndex) ++ { ++ int numDirectBits = ((posSlot >> 1) - 1); ++ rep0 = (2 | ((UInt32)posSlot & 1)); ++ if (posSlot < kEndPosModelIndex) ++ { ++ rep0 <<= numDirectBits; ++ prob = p + SpecPos + rep0 - posSlot - 1; ++ } ++ else ++ { ++ numDirectBits -= kNumAlignBits; ++ do ++ { ++ RC_NORMALIZE ++ Range >>= 1; ++ rep0 <<= 1; ++ if (Code >= Range) ++ { ++ Code -= Range; ++ rep0 |= 1; ++ } ++ } ++ while (--numDirectBits != 0); ++ prob = p + Align; ++ rep0 <<= kNumAlignBits; ++ numDirectBits = kNumAlignBits; ++ } ++ { ++ int i = 1; ++ int mi = 1; ++ do ++ { ++ CProb *prob3 = prob + mi; ++ RC_GET_BIT2(prob3, mi, ; , rep0 |= i); ++ i <<= 1; ++ } ++ while(--numDirectBits != 0); ++ } ++ } ++ else ++ rep0 = posSlot; ++ if (++rep0 == (UInt32)(0)) ++ { ++ /* it's for stream version */ ++ len = kLzmaStreamWasFinishedId; ++ break; ++ } ++ } ++ ++ len += kMatchMinLen; ++ #ifdef _LZMA_OUT_READ ++ if (rep0 > distanceLimit) ++ #else ++ if (rep0 > nowPos) ++ #endif ++ return LZMA_RESULT_DATA_ERROR; ++ ++ #ifdef _LZMA_OUT_READ ++ if (dictionarySize - distanceLimit > (UInt32)len) ++ distanceLimit += len; ++ else ++ distanceLimit = dictionarySize; ++ #endif ++ ++ do ++ { ++ #ifdef _LZMA_OUT_READ ++ UInt32 pos = dictionaryPos - rep0; ++ if (pos >= dictionarySize) ++ pos += dictionarySize; ++ previousByte = dictionary[pos]; ++ dictionary[dictionaryPos] = previousByte; ++ if (++dictionaryPos == dictionarySize) ++ dictionaryPos = 0; ++ #else ++ previousByte = outStream[nowPos - rep0]; ++ #endif ++ len--; ++ outStream[nowPos++] = previousByte; ++ } ++ while(len != 0 && nowPos < outSize); ++ } ++ } ++ RC_NORMALIZE; ++ ++ #ifdef _LZMA_OUT_READ ++ vs->Range = Range; ++ vs->Code = Code; ++ vs->DictionaryPos = dictionaryPos; ++ vs->GlobalPos = globalPos + (UInt32)nowPos; ++ vs->DistanceLimit = distanceLimit; ++ vs->Reps[0] = rep0; ++ vs->Reps[1] = rep1; ++ vs->Reps[2] = rep2; ++ vs->Reps[3] = rep3; ++ vs->State = state; ++ vs->RemainLen = len; ++ vs->TempDictionary[0] = tempDictionary[0]; ++ #endif ++ ++ #ifdef _LZMA_IN_CB ++ vs->Buffer = Buffer; ++ vs->BufferLim = BufferLim; ++ #else ++ *inSizeProcessed = (SizeT)(Buffer - inStream); ++ #endif ++ *outSizeProcessed = nowPos; ++ return LZMA_RESULT_OK; ++} +diff --git a/init/LzmaDecode.h b/init/LzmaDecode.h +new file mode 100644 +index 0000000..213062a +--- /dev/null ++++ b/init/LzmaDecode.h +@@ -0,0 +1,131 @@ ++/* ++ LzmaDecode.h ++ LZMA Decoder interface ++ ++ LZMA SDK 4.21 Copyright (c) 1999-2005 Igor Pavlov (2005-06-08) ++ http://www.7-zip.org/ ++ ++ LZMA SDK is licensed under two licenses: ++ 1) GNU Lesser General Public License (GNU LGPL) ++ 2) Common Public License (CPL) ++ It means that you can select one of these two licenses and ++ follow rules of that license. ++ ++ SPECIAL EXCEPTION: ++ Igor Pavlov, as the author of this code, expressly permits you to ++ statically or dynamically link your code (or bind by name) to the ++ interfaces of this file without subjecting your linked code to the ++ terms of the CPL or GNU LGPL. Any modifications or additions ++ to this file, however, are subject to the LGPL or CPL terms. ++*/ ++ ++#ifndef __LZMADECODE_H ++#define __LZMADECODE_H ++ ++/* #define _LZMA_IN_CB */ ++/* Use callback for input data */ ++ ++/* #define _LZMA_OUT_READ */ ++/* Use read function for output data */ ++ ++/* #define _LZMA_PROB32 */ ++/* It can increase speed on some 32-bit CPUs, ++ but memory usage will be doubled in that case */ ++ ++/* #define _LZMA_LOC_OPT */ ++/* Enable local speed optimizations inside code */ ++ ++/* #define _LZMA_SYSTEM_SIZE_T */ ++/* Use system's size_t. You can use it to enable 64-bit sizes supporting*/ ++ ++#ifndef UInt32 ++#ifdef _LZMA_UINT32_IS_ULONG ++#define UInt32 unsigned long ++#else ++#define UInt32 unsigned int ++#endif ++#endif ++ ++#ifndef SizeT ++#ifdef _LZMA_SYSTEM_SIZE_T ++#include <stddef.h> ++#define SizeT size_t ++#else ++#define SizeT UInt32 ++#endif ++#endif ++ ++#ifdef _LZMA_PROB32 ++#define CProb UInt32 ++#else ++#define CProb unsigned short ++#endif ++ ++#define LZMA_RESULT_OK 0 ++#define LZMA_RESULT_DATA_ERROR 1 ++ ++#ifdef _LZMA_IN_CB ++typedef struct _ILzmaInCallback ++{ ++ int (*Read)(void *object, const unsigned char **buffer, SizeT *bufferSize); ++} ILzmaInCallback; ++#endif ++ ++#define LZMA_BASE_SIZE 1846 ++#define LZMA_LIT_SIZE 768 ++ ++#define LZMA_PROPERTIES_SIZE 5 ++ ++typedef struct _CLzmaProperties ++{ ++ int lc; ++ int lp; ++ int pb; ++ #ifdef _LZMA_OUT_READ ++ UInt32 DictionarySize; ++ #endif ++}CLzmaProperties; ++ ++int LzmaDecodeProperties(CLzmaProperties *propsRes, const unsigned char *propsData, int size); ++ ++#define LzmaGetNumProbs(Properties) (LZMA_BASE_SIZE + (LZMA_LIT_SIZE << ((Properties)->lc + (Properties)->lp))) ++ ++#define kLzmaNeedInitId (-2) ++ ++typedef struct _CLzmaDecoderState ++{ ++ CLzmaProperties Properties; ++ CProb *Probs; ++ ++ #ifdef _LZMA_IN_CB ++ const unsigned char *Buffer; ++ const unsigned char *BufferLim; ++ #endif ++ ++ #ifdef _LZMA_OUT_READ ++ unsigned char *Dictionary; ++ UInt32 Range; ++ UInt32 Code; ++ UInt32 DictionaryPos; ++ UInt32 GlobalPos; ++ UInt32 DistanceLimit; ++ UInt32 Reps[4]; ++ int State; ++ int RemainLen; ++ unsigned char TempDictionary[4]; ++ #endif ++} CLzmaDecoderState; ++ ++#ifdef _LZMA_OUT_READ ++#define LzmaDecoderInit(vs) { (vs)->RemainLen = kLzmaNeedInitId; } ++#endif ++ ++int LzmaDecode(CLzmaDecoderState *vs, ++ #ifdef _LZMA_IN_CB ++ ILzmaInCallback *inCallback, ++ #else ++ const unsigned char *inStream, SizeT inSize, SizeT *inSizeProcessed, ++ #endif ++ unsigned char *outStream, SizeT outSize, SizeT *outSizeProcessed); ++ ++#endif +diff --git a/init/do_mounts_rd.c b/init/do_mounts_rd.c +index ed652f4..5fd1ec5 100644 +--- a/init/do_mounts_rd.c ++++ b/init/do_mounts_rd.c +@@ -5,7 +5,9 @@ + #include <linux/ext2_fs.h> + #include <linux/romfs_fs.h> + #include <linux/cramfs_fs.h> ++#include <linux/squashfs_fs.h> + #include <linux/initrd.h> ++#include <linux/vmalloc.h> + #include <linux/string.h> + + #include "do_mounts.h" +@@ -31,6 +33,9 @@ static int __init ramdisk_start_setup(char *str) + __setup("ramdisk_start=", ramdisk_start_setup); + + static int __init crd_load(int in_fd, int out_fd); ++#ifdef CONFIG_LZMA_INITRD ++static int __init lzma_rd_load(int in_fd, int out_fd); ++#endif + + /* + * This routine tries to find a RAM disk image to load, and returns the +@@ -39,6 +44,7 @@ static int __init crd_load(int in_fd, int out_fd); + * numbers could not be found. + * + * We currently check for the following magic numbers: ++ * squashfs + * minix + * ext2 + * romfs +@@ -53,6 +59,7 @@ identify_ramdisk_image(int fd, int start_block) + struct ext2_super_block *ext2sb; + struct romfs_super_block *romfsb; + struct cramfs_super *cramfsb; ++ struct squashfs_super_block *squashfsb; + int nblocks = -1; + unsigned char *buf; + +@@ -64,6 +71,7 @@ identify_ramdisk_image(int fd, int start_block) + ext2sb = (struct ext2_super_block *) buf; + romfsb = (struct romfs_super_block *) buf; + cramfsb = (struct cramfs_super *) buf; ++ squashfsb = (struct squashfs_super_block *) buf; + memset(buf, 0xe5, size); + + /* +@@ -82,6 +90,17 @@ identify_ramdisk_image(int fd, int start_block) + nblocks = 0; + goto done; + } ++ /* ++ * handle lzma compressed initrd, returns nblocks=1 as indication ++ */ ++ if( buf[0] < 9 * 5 * 5 && buf[9] == 0 && buf[10] == 0 && buf[11] == 0 ++ && buf[12] == 0 ) ++ { ++ printk( KERN_NOTICE "RAMDISK: LZMA image found at block %d\n", ++ start_block); ++ nblocks = 1; // just a convenient return flag ++ goto done; ++ } + + /* romfs is at block zero too */ + if (romfsb->word0 == ROMSB_WORD0 && +@@ -101,6 +120,18 @@ identify_ramdisk_image(int fd, int start_block) + goto done; + } + ++ /* squashfs is at block zero too */ ++ if (squashfsb->s_magic == SQUASHFS_MAGIC) { ++ printk(KERN_NOTICE ++ "RAMDISK: squashfs filesystem found at block %d\n", ++ start_block); ++ if (squashfsb->s_major < 3) ++ nblocks = (squashfsb->bytes_used_2+BLOCK_SIZE-1)>>BLOCK_SIZE_BITS; ++ else ++ nblocks = (squashfsb->bytes_used+BLOCK_SIZE-1)>>BLOCK_SIZE_BITS; ++ goto done; ++ } ++ + /* + * Read block 1 to test for minix and ext2 superblock + */ +@@ -172,7 +203,22 @@ int __init rd_load_image(char *from) + #endif + goto done; + } +- ++#ifdef CONFIG_LZMA_INITRD ++ /* ++ * handle lzma compressed image ++ */ ++ if ( nblocks == 1 ) ++ { ++ nblocks = 0; ++ if ( lzma_rd_load(in_fd, out_fd) == 0 ) ++ { ++ printk("\nLZMA initrd loaded successfully\n"); ++ goto successful_load; ++ } ++ printk(KERN_NOTICE "LZMA initrd is not in the correct format\n"); ++ goto done; ++ } ++#endif + /* + * NOTE NOTE: nblocks is not actually blocks but + * the number of kibibytes of data to load into a ramdisk. +@@ -393,6 +439,134 @@ static void __init error(char *x) + unzip_error = 1; + } + ++#ifdef CONFIG_LZMA_INITRD ++#define _LZMA_IN_CB ++#define _LZMA_OUT_READ ++#include "LzmaDecode.h" ++#include "LzmaDecode.c" ++ ++static int read_byte(void *object, const unsigned char **buffer, SizeT *bufferSize); ++ ++/* ++ * Do the lzma decompression ++ */ ++static int __init lzma_rd_load(int in_fd, int out_fd) ++{ ++ unsigned int i; ++ CLzmaDecoderState state; ++ unsigned char* outputbuffer; ++ unsigned int uncompressedSize = 0; ++ unsigned char* p; ++ unsigned int kBlockSize = 0x10000; ++ unsigned int nowPos = 0; ++ unsigned int outsizeProcessed = 0; ++ int res; ++ ILzmaInCallback callback; ++ ++ insize = 0; /* valid bytes in inbuf */ ++ inptr = 0; /* index of next byte to be processed in inbuf */ ++ exit_code = 0; ++ crd_infd = in_fd; ++ inbuf = kmalloc(INBUFSIZ, GFP_KERNEL); ++ if (inbuf == 0) ++ { ++ printk(KERN_ERR "RAMDISK: Couldn't allocate lzma input buffer\n"); ++ return -1; ++ } ++ ++ callback.Read = read_byte; ++ ++ /* lzma args */ ++ i = get_byte(); ++ state.Properties.lc = i % 9, i = i / 9; ++ state.Properties.lp = i % 5, state.Properties.pb = i / 5; ++ ++ /* read dictionary size */ ++ p = (char*)&state.Properties.DictionarySize; ++ for (i = 0; i < 4; i++) ++ *p++ = get_byte(); ++ ++ /* get uncompressedSize */ ++ p= (char*)&uncompressedSize; ++ for (i = 0; i < 4; i++) ++ *p++ = get_byte(); ++ ++ /* skip big file */ ++ for (i = 0; i < 4; i++) ++ get_byte(); ++ ++ printk( KERN_NOTICE "RAMDISK: LZMA lc=%d,lp=%d,pb=%d,dictSize=%d,origSize=%d\n", ++ state.Properties.lc, state.Properties.lp, state.Properties.pb, state.Properties.DictionarySize, uncompressedSize); ++ outputbuffer = kmalloc(kBlockSize, GFP_KERNEL); ++ if (outputbuffer == 0) { ++ printk(KERN_ERR "RAMDISK: Couldn't allocate lzma output buffer\n"); ++ return -1; ++ } ++ ++ state.Probs = (CProb*)kmalloc( LzmaGetNumProbs(&state.Properties)*sizeof(CProb), GFP_KERNEL); ++ if ( state.Probs == 0) { ++ printk(KERN_ERR "RAMDISK: Couldn't allocate lzma workspace\n"); ++ return -1; ++ } ++ ++#ifdef CONFIG_LZMA_INITRD_KMALLOC_ONLY ++ state.Dictionary = kmalloc( state.Properties.DictionarySize, GFP_KERNEL); ++#else ++ state.Dictionary = vmalloc( state.Properties.DictionarySize); ++#endif ++ if ( state.Dictionary == 0) { ++ printk(KERN_ERR "RAMDISK: Couldn't allocate lzma dictionary\n"); ++ return -1; ++ } ++ ++ printk( KERN_NOTICE "LZMA initrd by Ming-Ching Tiew <mctiew@yahoo.com> " ); ++ ++ LzmaDecoderInit( &state ); ++ ++ for( nowPos =0; nowPos < uncompressedSize ; ) ++ { ++ UInt32 blockSize = uncompressedSize - nowPos; ++ if( blockSize > kBlockSize) ++ blockSize = kBlockSize; ++ res = LzmaDecode( &state, &callback, outputbuffer, blockSize, &outsizeProcessed); ++ if( res != 0 ) { ++ printk( KERN_ERR "RAMDISK: Lzma decode failure\n"); ++ return -1; ++ } ++ if( outsizeProcessed == 0 ) ++ { ++ uncompressedSize = nowPos; ++ printk( KERN_NOTICE "RAMDISK nowPos=%d, uncompressedSize=%d\n", ++ nowPos, uncompressedSize ); ++ break; ++ } ++ sys_write(out_fd, outputbuffer, outsizeProcessed ); ++ nowPos += outsizeProcessed; ++ printk( "."); ++ } ++ ++#ifdef CONFIG_LZMA_INITRD_KMALLOC_ONLY ++ kfree(state.Dictionary); ++#else ++ vfree(state.Dictionary); ++#endif ++ kfree(inbuf); ++ kfree(outputbuffer); ++ kfree(state.Probs); ++ return 0; ++} ++ ++static int read_byte(void *object, const unsigned char **buffer, SizeT *bufferSize) ++{ ++ static unsigned char val; ++ *bufferSize = 1; ++ val = get_byte(); ++ *buffer = &val; ++ return LZMA_RESULT_OK; ++} ++ ++#endif /*CONFIG_LZMA_INITRD*/ ++ + static int __init crd_load(int in_fd, int out_fd) + { + int result; +diff --git a/init/initramfs.c b/init/initramfs.c +index 00eff7a..30d32a2 100644 +--- a/init/initramfs.c ++++ b/init/initramfs.c +@@ -6,6 +6,7 @@ + #include <linux/delay.h> + #include <linux/string.h> + #include <linux/syscalls.h> ++#include <linux/vmalloc.h> + + static __initdata char *message; + static void __init error(char *x) +@@ -441,6 +442,118 @@ static void __init flush_window(void) + outcnt = 0; + } + ++#ifdef CONFIG_LZMA_INITRAM_FS ++#define _LZMA_IN_CB ++#define _LZMA_OUT_READ ++#include "LzmaDecode.h" ++#ifndef CONFIG_LZMA_INITRD ++ #include "LzmaDecode.c" ++#endif ++static int read_byte(void *object, const unsigned char **buffer, SizeT *bufferSize) ++{ ++ static unsigned char val; ++ *bufferSize = 1; ++ val = get_byte(); ++ *buffer = &val; ++ return LZMA_RESULT_OK; ++} ++ ++static int __init lzma_unzip(void) ++{ ++ unsigned int i; ++ CLzmaDecoderState state; ++ unsigned char* outputbuffer; ++ unsigned int uncompressedSize = 0; ++ unsigned char* p; ++ unsigned int kBlockSize = 0x10000; ++ unsigned int nowPos = 0; ++ unsigned int outsizeProcessed = 0; ++ int res; ++ ILzmaInCallback callback; ++ ++ callback.Read = read_byte; ++ ++ // lzma args ++ i = get_byte(); ++ state.Properties.lc = i % 9, i = i / 9; ++ state.Properties.lp = i % 5, state.Properties.pb = i / 5; ++ ++ // read dictionary size ++ p = (char*)&state.Properties.DictionarySize; ++ for (i = 0; i < 4; i++) ++ *p++ = get_byte(); ++ ++ // get uncompressedSize ++ p= (char*)&uncompressedSize; ++ for (i = 0; i < 4; i++) ++ *p++ = get_byte(); ++ ++ // skip big file ++ for (i = 0; i < 4; i++) ++ get_byte(); ++ ++ printk( KERN_NOTICE "initramfs: LZMA lc=%d,lp=%d,pb=%d,dictSize=%d,origSize=%d\n", ++ state.Properties.lc,state.Properties.lp,state.Properties.pb,state.Properties.DictionarySize, uncompressedSize); ++ outputbuffer = kmalloc(kBlockSize, GFP_KERNEL); ++ if (outputbuffer == 0) { ++ printk(KERN_ERR "initramfs: Couldn't allocate lzma output buffer\n"); ++ return -1; ++ } ++ ++ state.Probs = (CProb*) kmalloc( LzmaGetNumProbs(&state.Properties)*sizeof(CProb), GFP_KERNEL); ++ if ( state.Probs == 0) { ++ printk(KERN_ERR "initramfs: Couldn't allocate lzma workspace\n"); ++ return -1; ++ } ++ ++#ifdef CONFIG_LZMA_INITRAM_FS_KMALLOC_ONLY ++ state.Dictionary = kmalloc( state.Properties.DictionarySize, GFP_KERNEL); ++#else ++ state.Dictionary = vmalloc( state.Properties.DictionarySize); ++#endif ++ if ( state.Dictionary == 0) { ++ printk(KERN_ERR "initramfs: Couldn't allocate lzma dictionary\n"); ++ return -1; ++ } ++ ++ printk( KERN_NOTICE "LZMA initramfs by Ming-Ching Tiew <mctiew@yahoo.com> " ); ++ ++ LzmaDecoderInit( &state ); ++ ++ for( nowPos =0; nowPos < uncompressedSize ; ) ++ { ++ UInt32 blockSize = uncompressedSize - nowPos; ++ if( blockSize > kBlockSize) ++ blockSize = kBlockSize; ++ res = LzmaDecode( &state, &callback, outputbuffer, blockSize, &outsizeProcessed); ++ if( res != 0 ) { ++ panic( KERN_ERR "initramfs: Lzma decode failure\n"); ++ return -1; ++ } ++ if( outsizeProcessed == 0 ) ++ { ++ uncompressedSize = nowPos; ++ printk( KERN_NOTICE "initramfs: nowPos=%d, uncompressedSize=%d\n", ++ nowPos, uncompressedSize ); ++ break; ++ } ++ flush_buffer(outputbuffer, outsizeProcessed); ++ nowPos += outsizeProcessed; ++ printk( "."); ++ } ++ ++#ifdef CONFIG_LZMA_INITRAM_FS_KMALLOC_ONLY ++ kfree(state.Dictionary); ++#else ++ vfree(state.Dictionary); ++#endif ++ kfree(outputbuffer); ++ kfree(state.Probs); ++ return 0; ++} ++ ++#endif /*CONFIG LZMA_INITRAM_FS*/ ++ + static char * __init unpack_to_rootfs(char *buf, unsigned len, int check_only) + { + int written; +@@ -475,12 +588,31 @@ static char * __init unpack_to_rootfs(char *buf, unsigned len, int check_only) + inptr = 0; + outcnt = 0; /* bytes in output buffer */ + bytes_out = 0; +- crc = (ulg)0xffffffffL; /* shift register contents */ +- makecrc(); +- gunzip(); +- if (state != Reset) ++ if( inbuf[0] == 037 && ((inbuf[1] == 0213) || (inbuf[1] == 0236))) ++ { ++ printk( KERN_NOTICE "detected gzip initramfs\n"); ++ crc = (ulg)0xffffffffL; /* shift register contents */ ++ makecrc(); ++ gunzip(); ++ if (state != Reset) + error("junk in gzipped archive"); +- this_header = saved_offset + inptr; ++ } ++#ifdef CONFIG_LZMA_INITRAM_FS ++ else if( inbuf[0] < 9 * 5 * 5 && buf[9] == 0 && buf[10] == 0 ++ && buf[11] == 0 && buf[12] == 0 ) ++ { ++ printk( KERN_NOTICE "detected lzma initramfs\n"); ++ lzma_unzip(); ++ } ++#endif ++ else ++ { ++ // skip forward ? ++ crc = (ulg)0xffffffffL; /* shift register contents */ ++ makecrc(); ++ gunzip(); ++ } ++ this_header = saved_offset + inptr; + buf += inptr; + len -= inptr; + } +diff --git a/kernel/Makefile b/kernel/Makefile +index ac6b27a..bd498a2 100644 +--- a/kernel/Makefile ++++ b/kernel/Makefile +@@ -66,7 +66,7 @@ $(obj)/configs.o: $(obj)/config_data.h + # config_data.h contains the same information as ikconfig.h but gzipped. + # Info from config_data can be extracted from /proc/config* + targets += config_data.gz +-$(obj)/config_data.gz: .config FORCE ++$(obj)/config_data.gz: .miniconfig FORCE + $(call if_changed,gzip) + + quiet_cmd_ikconfiggz = IKCFG $@ +diff --git a/kernel/configs.c b/kernel/configs.c +index 8fa1fb2..c8407eb 100644 +--- a/kernel/configs.c ++++ b/kernel/configs.c +@@ -88,7 +88,7 @@ static int __init ikconfig_init(void) + struct proc_dir_entry *entry; + + /* create the current config file */ +- entry = create_proc_entry("config.gz", S_IFREG | S_IRUGO, ++ entry = create_proc_entry("miniconfig.gz", S_IFREG | S_IRUGO, + &proc_root); + if (!entry) + return -ENOMEM; +@@ -104,7 +104,7 @@ static int __init ikconfig_init(void) + + static void __exit ikconfig_cleanup(void) + { +- remove_proc_entry("config.gz", &proc_root); ++ remove_proc_entry("miniconfig.gz", &proc_root); + } + + module_init(ikconfig_init); +diff --git a/kernel/time/clocksource.c b/kernel/time/clocksource.c +index fe5c7db..a5150e6 100644 +--- a/kernel/time/clocksource.c ++++ b/kernel/time/clocksource.c +@@ -85,8 +85,8 @@ static void clocksource_ratewd(struct clocksource *cs, int64_t delta) + if (delta > -WATCHDOG_TRESHOLD && delta < WATCHDOG_TRESHOLD) + return; + +- printk(KERN_WARNING "Clocksource %s unstable (delta = %Ld ns)\n", +- cs->name, delta); ++/* printk(KERN_WARNING "Clocksource %s unstable (delta = %Ld ns)\n", ++ cs->name, delta); */ + cs->flags &= ~(CLOCK_SOURCE_VALID_FOR_HRES | CLOCK_SOURCE_WATCHDOG); + clocksource_change_rating(cs, 0); + cs->flags &= ~CLOCK_SOURCE_WATCHDOG; +diff --git a/kernel/timer.c b/kernel/timer.c +index dd6c2c1..3a8f485 100644 +--- a/kernel/timer.c ++++ b/kernel/timer.c +@@ -916,8 +916,8 @@ static void change_clocksource(void) + + tick_clock_notify(); + +- printk(KERN_INFO "Time: %s clocksource has been installed.\n", +- clock->name); ++/* printk(KERN_INFO "Time: %s clocksource has been installed.\n", ++ clock->name); */ + } + #else + static inline void change_clocksource(void) { } +diff --git a/miniconfig.sh b/miniconfig.sh +new file mode 100755 +index 0000000..28e7433 +--- /dev/null ++++ b/miniconfig.sh +@@ -0,0 +1,2 @@ ++#!/bin/sh -f ++make allnoconfig KCONFIG_ALLCONFIG=.miniconfig +diff --git a/scripts/Makefile.lib b/scripts/Makefile.lib +index fc498fe..e98172c 100644 +--- a/scripts/Makefile.lib ++++ b/scripts/Makefile.lib +@@ -162,4 +162,9 @@ cmd_objcopy = $(OBJCOPY) $(OBJCOPYFLAGS) $(OBJCOPYFLAGS_$(@F)) $< $@ + quiet_cmd_gzip = GZIP $@ + cmd_gzip = gzip -f -9 < $< > $@ + ++# LZMA ++# ++quiet_cmd_lzma = LZMA $@ ++cmd_lzma = lzma e $< $@ -lc7 -lp0 -pb0 2>/dev/null ++ + +diff --git a/scripts/gen_lzma_initramfs_list.sh b/scripts/gen_lzma_initramfs_list.sh +new file mode 100644 +index 0000000..be3ed6a +--- /dev/null ++++ b/scripts/gen_lzma_initramfs_list.sh +@@ -0,0 +1,292 @@ ++#!/bin/bash ++# Copyright (C) Martin Schlemmer <azarah@nosferatu.za.org> ++# Copyright (c) 2006 Sam Ravnborg <sam@ravnborg.org> ++# ++# Released under the terms of the GNU GPL ++# ++# Generate a cpio packed initramfs. It uses gen_init_cpio to generate ++# the cpio archive, and gzip to pack it. ++# The script may also be used to generate the inputfile used for gen_init_cpio ++# This script assumes that gen_init_cpio is located in usr/ directory ++ ++# error out on errors ++set -e ++ ++usage() { ++cat << EOF ++Usage: ++$0 [-o <file>] [-u <uid>] [-g <gid>] { -s | -d | <cpio_source>} ... ++ -o <file> Create lzma initramfs file named <file> using ++ gen_init_cpio and lzma ++ -u <uid> User ID to map to user ID 0 (root). ++ <uid> is only meaningful if <cpio_source> ++ is a directory. ++ -g <gid> Group ID to map to group ID 0 (root). ++ <gid> is only meaningful if <cpio_source> ++ is a directory. ++ <cpio_source> File list or directory for cpio archive. ++ If <cpio_source> is a .cpio file it will be used ++ as direct input to initramfs. ++ -s Create lzma file with small dictionary size ++ -d Output the default cpio list. ++ ++All options except -o and -l may be repeated and are interpreted ++sequentially and immediately. -u and -g states are preserved across ++<cpio_source> options so an explicit "-u 0 -g 0" is required ++to reset the root/group mapping. ++EOF ++} ++ ++list_default_initramfs() { ++ # echo usr/kinit/kinit ++ : ++} ++ ++default_initramfs() { ++ cat <<-EOF >> ${output} ++ # This is a very simple, default initramfs ++ ++ dir /dev 0755 0 0 ++ nod /dev/console 0600 0 0 c 5 1 ++ dir /root 0700 0 0 ++ # file /kinit usr/kinit/kinit 0755 0 0 ++ # slink /init kinit 0755 0 0 ++ EOF ++} ++ ++filetype() { ++ local argv1="$1" ++ ++ # symlink test must come before file test ++ if [ -L "${argv1}" ]; then ++ echo "slink" ++ elif [ -f "${argv1}" ]; then ++ echo "file" ++ elif [ -d "${argv1}" ]; then ++ echo "dir" ++ elif [ -b "${argv1}" -o -c "${argv1}" ]; then ++ echo "nod" ++ elif [ -p "${argv1}" ]; then ++ echo "pipe" ++ elif [ -S "${argv1}" ]; then ++ echo "sock" ++ else ++ echo "invalid" ++ fi ++ return 0 ++} ++ ++list_print_mtime() { ++ : ++} ++ ++print_mtime() { ++ local my_mtime="0" ++ ++ if [ -e "$1" ]; then ++ my_mtime=$(find "$1" -printf "%T@\n" | sort -r | head -n 1) ++ fi ++ ++ echo "# Last modified: ${my_mtime}" >> ${output} ++ echo "" >> ${output} ++} ++ ++list_parse() { ++ echo "$1 \\" ++} ++ ++# for each file print a line in following format ++# <filetype> <name> <path to file> <octal mode> <uid> <gid> ++# for links, devices etc the format differs. See gen_init_cpio for details ++parse() { ++ local location="$1" ++ local name="${location/${srcdir}//}" ++ # change '//' into '/' ++ name="${name//\/\///}" ++ local mode="$2" ++ local uid="$3" ++ local gid="$4" ++ local ftype=$(filetype "${location}") ++ # remap uid/gid to 0 if necessary ++ [ "$uid" -eq "$root_uid" ] && uid=0 ++ [ "$gid" -eq "$root_gid" ] && gid=0 ++ local str="${mode} ${uid} ${gid}" ++ ++ [ "${ftype}" == "invalid" ] && return 0 ++ [ "${location}" == "${srcdir}" ] && return 0 ++ ++ case "${ftype}" in ++ "file") ++ str="${ftype} ${name} ${location} ${str}" ++ ;; ++ "nod") ++ local dev_type= ++ local maj=$(LC_ALL=C ls -l "${location}" | \ ++ gawk '{sub(/,/, "", $5); print $5}') ++ local min=$(LC_ALL=C ls -l "${location}" | \ ++ gawk '{print $6}') ++ ++ if [ -b "${location}" ]; then ++ dev_type="b" ++ else ++ dev_type="c" ++ fi ++ str="${ftype} ${name} ${str} ${dev_type} ${maj} ${min}" ++ ;; ++ "slink") ++ local target=$(LC_ALL=C ls -l "${location}" | \ ++ gawk '{print $11}') ++ str="${ftype} ${name} ${target} ${str}" ++ ;; ++ *) ++ str="${ftype} ${name} ${str}" ++ ;; ++ esac ++ ++ echo "${str}" >> ${output} ++ ++ return 0 ++} ++ ++unknown_option() { ++ printf "ERROR: unknown option \"$arg\"\n" >&2 ++ printf "If the filename validly begins with '-', " >&2 ++ printf "then it must be prefixed\n" >&2 ++ printf "by './' so that it won't be interpreted as an option." >&2 ++ printf "\n" >&2 ++ usage >&2 ++ exit 1 ++} ++ ++list_header() { ++ : ++} ++ ++header() { ++ printf "\n#####################\n# $1\n" >> ${output} ++} ++ ++# process one directory (incl sub-directories) ++dir_filelist() { ++ ${dep_list}header "$1" ++ ++ srcdir=$(echo "$1" | sed -e 's://*:/:g') ++ dirlist=$(find "${srcdir}" -printf "%p %m %U %G\n" 2>/dev/null) ++ ++ # If $dirlist is only one line, then the directory is empty ++ if [ "$(echo "${dirlist}" | wc -l)" -gt 1 ]; then ++ ${dep_list}print_mtime "$1" ++ ++ echo "${dirlist}" | \ ++ while read x; do ++ ${dep_list}parse ${x} ++ done ++ fi ++} ++ ++# if only one file is specified and it is .cpio file then use it direct as fs ++# if a directory is specified then add all files in given direcotry to fs ++# if a regular file is specified assume it is in gen_initramfs format ++input_file() { ++ source="$1" ++ if [ -f "$1" ]; then ++ ${dep_list}header "$1" ++ is_cpio="$(echo "$1" | sed 's/^.*\.cpio/cpio/')" ++ if [ $2 -eq 0 -a ${is_cpio} == "cpio" ]; then ++ cpio_file=$1 ++ [ ! -z ${dep_list} ] && echo "$1" ++ return 0 ++ fi ++ if [ -z ${dep_list} ]; then ++ print_mtime "$1" >> ${output} ++ cat "$1" >> ${output} ++ else ++ cat "$1" | while read type dir file perm ; do ++ if [ "$type" == "file" ]; then ++ echo "$file \\"; ++ fi ++ done ++ fi ++ elif [ -d "$1" ]; then ++ dir_filelist "$1" ++ else ++ echo " ${prog}: Cannot open '$1'" >&2 ++ exit 1 ++ fi ++} ++ ++prog=$0 ++root_uid=0 ++root_gid=0 ++dep_list= ++cpio_file= ++cpio_list= ++output="/dev/stdout" ++output_file="" ++opt="" ++ ++arg="$1" ++case "$arg" in ++ "-l") # files included in initramfs - used by kbuild ++ dep_list="list_" ++ echo "deps_initramfs := \\" ++ shift ++ ;; ++ "-o") # generate lzma-ed cpio image named $1 ++ shift ++ output_file="$1" ++ cpio_list="$(mktemp ${TMPDIR:-/tmp}/cpiolist.XXXXXX)" ++ output=${cpio_list} ++ shift ++ ;; ++esac ++while [ $# -gt 0 ]; do ++ arg="$1" ++ shift ++ case "$arg" in ++ "-u") # map $1 to uid=0 (root) ++ root_uid="$1" ++ shift ++ ;; ++ "-g") # map $1 to gid=0 (root) ++ root_gid="$1" ++ shift ++ ;; ++ "-s") ++ opt="-d16" ++ ;; ++ "-d") # display default initramfs list ++ default_list="$arg" ++ ${dep_list}default_initramfs ++ ;; ++ "-h") ++ usage ++ exit 0 ++ ;; ++ *) ++ case "$arg" in ++ "-"*) ++ unknown_option ++ ;; ++ *) # input file/dir - process it ++ input_file "$arg" "$#" ++ ;; ++ esac ++ ;; ++ esac ++done ++ ++# If output_file is set we will generate cpio archive and lzma it ++# we are carefull to delete tmp files ++if [ ! -z ${output_file} ]; then ++ if [ -z ${cpio_file} ]; then ++ cpio_tfile="$(mktemp ${TMPDIR:-/tmp}/cpiofile.XXXXXX)" ++ usr/gen_init_cpio ${cpio_list} > ${cpio_tfile} ++ else ++ cpio_tfile=${cpio_file} ++ fi ++ rm ${cpio_list} ++ lzma e ${cpio_tfile} ${output_file} ${opt} ++ [ -z ${cpio_file} ] && rm ${cpio_tfile} ++fi ++exit 0 +diff --git a/shrinkconfig.sh b/shrinkconfig.sh +new file mode 100755 +index 0000000..e7a3df7 +--- /dev/null ++++ b/shrinkconfig.sh +@@ -0,0 +1,79 @@ ++#! /bin/bash ++ ++# shrinkconfig copyright 2006 by Rob Landley <rob@landley.net> ++# Licensed under the GNU General Public License version 2. ++ ++if [ $# -ne 1 ] ++then ++ echo "Turns current .config into a miniconfig file." ++ echo "Usage: shrinkconfig mini.config" ++ exit 1 ++fi ++ ++if [ ! -f .config ] ++then ++ echo "Need a .config file to shrink." ++ exit 1 ++fi ++LENGTH=$(wc -l < .config) ++ ++OUTPUT="$1" ++cp .config "$OUTPUT" ++if [ $? -ne 0 ] ++then ++ echo "Couldn't create $OUTPUT" ++ exit 1 ++fi ++ ++# If we get interrupted, clean up the mess ++ ++KERNELOUTPUT="" ++ ++function cleanup ++{ ++ echo ++ echo "Interrupted." ++ [ ! -z "$KERNELOUTPUT" ] && rm -rf "$KERNELOUTPUT" ++ rm "$OUTPUT" ++ exit 1 ++} ++ ++trap cleanup HUP INT QUIT TERM ++ ++# Since the "O=" argument to make doesn't work recursively, we need to jump ++# through a few hoops to avoid overwriting the .config that we're shrinking. ++ ++# If we're building out of tree, we'll have absolute paths to source and build ++# directories in the Makefile. ++ ++KERNELSRC=$(sed -n -e 's/KERNELSRC[^/]*:=[^/]*//p' Makefile) ++[ -z "$KERNELSRC" ] && KERNELSRC=$(pwd) ++KERNELOUTPUT=`pwd`/.config.minitemp ++ ++mkdir -p "$KERNELOUTPUT" || exit 1 ++ ++echo "Shrinking .config to $OUTPUT..." ++ ++for I in $(seq 1 $LENGTH) ++do ++ echo -n -e "\r"$I/$LENGTH lines $(wc -c < "$OUTPUT") bytes ++ ++ sed -n "${I}!p" "$OUTPUT" > "$KERNELOUTPUT"/.config.test ++ # Do a config with this file ++ make -C "$KERNELSRC" O="$KERNELOUTPUT" allnoconfig KCONFIG_ALLCONFIG="$KERNELOUTPUT"/.config.test > /dev/null ++ ++ # Compare. The date changes, so expect a small difference each time. ++ D=$(diff "$KERNELOUTPUT"/.config .config | wc -l) ++ if [ $D -eq 4 ] ++ then ++ mv "$KERNELOUTPUT"/.config.test "$OUTPUT" ++ LENGTH=$[$LENGTH-1] ++ else ++ I=$[$I + 1] ++ fi ++done ++ ++rm -rf "$KERNELOUTPUT" ++ ++# One extra echo to preserve status line. ++echo +diff --git a/usr/Makefile b/usr/Makefile +index 201f27f..8e1f6ea 100644 +--- a/usr/Makefile ++++ b/usr/Makefile +@@ -19,6 +19,7 @@ $(obj)/initramfs_data.o: $(obj)/initramfs_data.cpio.gz FORCE + + hostprogs-y := gen_init_cpio + initramfs := $(CONFIG_SHELL) $(srctree)/scripts/gen_initramfs_list.sh ++lzma_initramfs := $(CONFIG_SHELL) $(srctree)/scripts/gen_lzma_initramfs_list.sh + ramfs-input := $(if $(filter-out "",$(CONFIG_INITRAMFS_SOURCE)), \ + $(shell echo $(CONFIG_INITRAMFS_SOURCE)),-d) + ramfs-args := \ +@@ -36,6 +37,14 @@ endif + quiet_cmd_initfs = GEN $@ + cmd_initfs = $(initramfs) -o $@ $(ramfs-args) $(ramfs-input) + ++ifdef CONFIG_LZMA_INITRAM_FS_SMALLMEM ++quiet_cmd_lzma_initfs = LZRAMFS $@ ++ cmd_lzma_initfs = $(lzma_initramfs) -o $@ $(ramfs-args) -s $(ramfs-input) ++else ++quiet_cmd_lzma_initfs = LZRAMFS $@ ++ cmd_lzma_initfs = $(lzma_initramfs) -o $@ $(ramfs-args) $(ramfs-input) ++endif ++ + targets := initramfs_data.cpio.gz + # do not try to update files included in initramfs + $(deps_initramfs): ; +@@ -48,5 +57,9 @@ $(deps_initramfs): klibcdirs + # 4) arguments to gen_initramfs.sh changes + $(obj)/initramfs_data.cpio.gz: $(obj)/gen_init_cpio $(deps_initramfs) klibcdirs + $(Q)$(initramfs) -l $(ramfs-input) > $(obj)/.initramfs_data.cpio.gz.d ++ifdef CONFIG_LZMA_INITRAM_FS ++ $(call if_changed,lzma_initfs) ++else + $(call if_changed,initfs) ++endif + |