open Diskimage_impl
open Int63.Operators
+let id = "ntfs"
+
+(* Type of the private data, basically all the metadata that we
+ * read from the NTFS volume.
+ *)
+type ntfs_fs = {
+ ntfs_dev : device; (* Device. *)
+ ntfs_blocksize : int63; (* Blocksize (cluster size) *)
+ ntfs_mft_lcn : int63; (* MFT location (bytes) *)
+ ntfs_mft_size : int63; (* MFT size (bytes) *)
+ ntfs_mft_records : ntfs_mft_record list; (* Files in MFT *)
+}
+and ntfs_mft_record = {
+ ntfs_filename : ntfs_filename option; (* Filename, if present. *)
+ ntfs_info : ntfs_info option; (* Standard information, if present. *)
+ ntfs_data : ntfs_data option; (* $Data stream, if present. *)
+}
+and ntfs_filename = {
+ ntfs_name : string; (* Filename (UTF-8 encoded). *)
+}
+and ntfs_info = {
+ ntfs_creation_time : int64;
+ ntfs_last_data_change_time : int64;
+ ntfs_last_mft_change_time : int64;
+ ntfs_last_access_time : int64;
+}
+and ntfs_data = {
+ ntfs_data_size : int63; (* Actual size of data. *)
+ ntfs_runlist : ntfs_runentry list; (* Runlist. *)
+}
+and ntfs_runentry =
+ (* VCN start,size => LCN / None if sparse hole *)
+ (int63 * int63) * int63 option
+
(* Private data functions. *)
let attach_private_data, get_private_data =
private_data_functions (fun {fs_cb = {fs_cb_uq = u}} -> u)
-let id = "ntfs"
-
+(* Probe for an NTFS filesystem on this device. *)
let rec probe dev =
let fs = probe_superblock dev in
fs
dev#name blocksize volume_serial_number;
let blocksize = Int63.of_int blocksize in
+ let number_of_sectors = Int63.of_int64 number_of_sectors in
(* The blocksize of the filesystem is likely to be quite different
* from that of the underlying device, so create an overlay device
let mft = parse_mft dev mft_lcn mft_size in
- raise Not_found (* XXX *)
+ let ntfs = {
+ ntfs_dev = fs_dev;
+ ntfs_blocksize = blocksize;
+ ntfs_mft_lcn = mft_lcn;
+ ntfs_mft_size = mft_size;
+ ntfs_mft_records = mft
+ } in
+
+ (* Query free space. I cannot find any metadata in the NTFS
+ * structures which records free space directly, so instead we
+ * need to read the $Bitmap::$Data (bitmap of allocated LCNs).
+ *)
+ let blocks_used, blocks_avail = parse_bitmap_freespace ntfs in
+
+ (* Create a filesystem structure. *)
+ let fs = {
+ fs_cb = callbacks ();
+ fs_dev = fs_dev;
+ fs_blocksize = blocksize;
+ fs_blocks_total = number_of_sectors *^ bytes_per_sector /^ blocksize;
+ fs_is_swap = false;
+ fs_blocks_reserved = ~^0; (* XXX MFT, bitmap are "reserved" *)
+ fs_blocks_avail = blocks_avail;
+ fs_blocks_used = blocks_used;
+ fs_inodes_total = ~^0; (* XXX MFT records are like inodes *)
+ fs_inodes_reserved = ~^0;
+ fs_inodes_avail = ~^0;
+ fs_inodes_used = ~^0;
+ } in
+
+ attach_private_data fs ntfs;
+ fs
| { _ } -> raise Not_found (* Not an NTFS boot sector. *)
if !debug then
eprintf "got an MFT record, now parsing attributes ...\n%!";
- let attrs = parse_attrs attrs in
+ let mft_record = {
+ ntfs_filename = None;
+ ntfs_info = None;
+ ntfs_data = None
+ } in
+ let mft_record = parse_attrs attrs mft_record in
- parse_mft_records rest (* loop rest of MFT records *)
+ mft_record :: parse_mft_records rest (* loop rest of MFT records *)
(* Just assume that the end of the list of MFT records
* is marked by all zeroes. This seems to be the
* case, but not sure if it is generally true.
* XXX?
*)
- | { 0x00000000_l : 32 } ->
- ()
+ | { 0x00000000_l : 32 } -> []
- | { _ } -> ()
+ | { _ } -> []
-and parse_attrs attrs =
+and parse_attrs attrs mft_record =
(* Parse the MFT record attributes. *)
bitmatch attrs with
| { 0xFFFFFFFF_l : 32 : littleendian } -> (* AT_END *)
if !debug then
eprintf "found AT_END, end of attributes\n%!";
- ()
+ mft_record
| { attr_type : 32 : littleendian;
attr_size : 32 : littleendian;
attr : (Int32.to_int attr_size - 24) * 8 : bitstring;
rest : -1 : bitstring } ->
- (* XXX let attr = *) parse_resident_attr attr_type attr;
- parse_attrs rest
+ let mft_record = parse_resident_attr attr_type attr mft_record in
+ parse_attrs rest mft_record
| { attr_type : 32 : littleendian;
attr_size : 32 : littleendian;
rest : -1 : bitstring } ->
- (* XXX let attr = *)
- parse_nonresident_attr attr_type highest_vcn
- allocated_size data_size initialized_size
- mapping_pairs;
+ let data_size = Int63.of_int64 data_size in
+
+ let mft_record =
+ parse_nonresident_attr attr_type highest_vcn
+ allocated_size data_size initialized_size
+ mapping_pairs mft_record in
- parse_attrs rest
+ parse_attrs rest mft_record
(* Not matched above, so we don't know how to parse this attribute, but
* there is still enough information to skip to the next one.
pad : (Int32.to_int attr_size - 8) * 8 : bitstring;
rest : -1 : bitstring } ->
- if !debug then (
- eprintf "cannot parse MFT attribute entry\n%!";
- Bitmatch.hexdump_bitstring Pervasives.stderr attrs
- );
+ if !debug then
+ eprintf "cannot parse MFT attribute entry, attr_type = %lx\n%!"
+ attr_type;
- parse_attrs rest
+ parse_attrs rest mft_record
(* Otherwise unparsable & unskippable attribute entry. *)
| { _ } ->
if !debug then
- eprintf "corrupt MFT attribute entry\n%!"
+ eprintf "corrupt MFT attribute entry\n%!";
+ mft_record
-and parse_resident_attr attr_type attr =
+and parse_resident_attr attr_type attr mft_record =
match attr_type with
| 0x10_l -> (* AT_STANDARD_INFORMATION *)
(bitmatch attr with
last_mft_change_time : 64;
last_access_time : 64
(* other stuff follows, just ignore it *) } ->
- if !debug then
- eprintf "creation time: %Lx, last_access_time: %Lx\n"
- creation_time last_access_time
+
+ let info = {
+ ntfs_creation_time = creation_time;
+ ntfs_last_data_change_time = last_data_change_time;
+ ntfs_last_mft_change_time = last_mft_change_time;
+ ntfs_last_access_time = last_access_time
+ } in
+ { mft_record with ntfs_info = Some info }
| { _ } ->
if !debug then
- eprintf "cannot parse AT_STANDARD_INFORMATION\n%!"
+ eprintf "cannot parse AT_STANDARD_INFORMATION\n%!";
+ mft_record
);
| 0x30_l -> (* AT_FILE_NAME *)
_ : 64; (* last change time *)
_ : 64; (* last MFT change time *)
_ : 64; (* last access time *)
- allocated_size : 64 : littleendian;
- data_size : 64 : littleendian;
+ _ : 64; (* allocated size *)
+ _ : 64; (* data size *)
_ : 32;
_ : 32;
name_len : 8;
name : name_len*16 : string } ->
let name = ucs2_to_utf8 name name_len in
- if !debug then
- eprintf "filename: %s (size: %Ld bytes)\n" name data_size
+ let filename = {
+ ntfs_name = name
+ } in
+ { mft_record with ntfs_filename = Some filename }
| { _ } ->
if !debug then
- eprintf "cannot parse AT_FILE_NAME\n%!"
+ eprintf "cannot parse AT_FILE_NAME\n%!";
+ mft_record
);
| _ -> (* unknown attribute - just ignore *)
if !debug then
- eprintf "unknown resident attribute %lx\n%!" attr_type
+ eprintf "unknown resident attribute %lx\n%!" attr_type;
+ mft_record
and parse_nonresident_attr attr_type highest_vcn
allocated_size data_size initialized_size
- mapping_pairs =
+ mapping_pairs mft_record =
match attr_type with
| 0x80_l -> (* AT_DATA, ie. the $Data stream *)
- if !debug then (
- eprintf "AT_DATA: size = %Ld bytes, highest_vcn = 0x%Lx\n"
- data_size highest_vcn;
- Bitmatch.hexdump_bitstring Pervasives.stderr mapping_pairs
- );
-
let lowest_vcn = ~^0 (* see assumption above *) in
let runlist = parse_runlist lowest_vcn ~^0 mapping_pairs in
if !debug then (
) runlist
);
+ let data = {
+ ntfs_data_size = data_size;
+ ntfs_runlist = runlist
+ } in
+ { mft_record with ntfs_data = Some data }
+
| _ ->
if !debug then
- eprintf "unknown non-resident attribute %lx\n%!" attr_type
+ eprintf "unknown non-resident attribute %lx\n%!" attr_type;
+ mft_record
(* mapping_pairs is not straightforward and not documented well. See
* ntfsprogs libntfs/runlist.c:ntfs_mapping_pairs_decompress
let lcn = lcn +^ deltalcn in
- eprintf "lcnlen = %d, vcnlen = %d\n" lcnlen vcnlen;
-
((vcn, deltavcn), Some lcn) ::
parse_runlist (vcn +^ deltavcn) lcn rest
done;
outstr
-and offset_is_free _ _ = false
+(* Parse $Bitmap::$Data to get free/used. Returns (used, free) blocks. *)
+and parse_bitmap_freespace ntfs =
+ (* Can throw Not_found - allow that to escape because we don't
+ * expect an NTFS filesystem without this magic file.
+ *)
+ let file = find_system_file ntfs "$Bitmap" in
+
+ (* Count used/free bits. *)
+ let used = ref ~^0 and free = ref ~^0 in
+ iter_blocks ntfs file (
+ fun lcn vcn data ->
+ for i = 0 to String.length data - 1 do
+ let c = Char.code data.[i] in
+ if c = 0 then (* common cases *)
+ free := !free +^ ~^8
+ else if c = 0xff then
+ used := !used +^ ~^8
+ else ( (* uncommon case: count the bits *)
+ let m = ref 0x80 in
+ while !m > 0 do
+ if c land !m <> 0 then
+ used := !used +^ ~^1
+ else
+ free := !free +^ ~^1;
+ m := !m lsr 1
+ done
+ )
+ done
+ );
+ (!used, !free)
+
+and find_system_file { ntfs_mft_records = mft_records } fname =
+ let rec loop =
+ function
+ | [] -> raise Not_found
+ | ({ ntfs_filename = Some { ntfs_name = name } } as file) :: _
+ when name = fname ->
+ file
+ | _ :: rest -> loop rest
+ in
+ loop mft_records
+
+and iter_blocks { ntfs_blocksize = blocksize; ntfs_dev = dev }
+ { ntfs_data = data } f =
+ match data with
+ | None -> () (* No $Data attribute. *)
+ | Some { ntfs_data_size = data_size; ntfs_runlist = runlist } ->
+ let rec loop data_size = function
+ | [] -> ()
+
+ (* Run of vcnsize clusters. *)
+ | ((vcnstart, vcnsize), Some lcn) :: rest ->
+ let data_size = ref data_size in
+ let lcn = ref lcn in
+ let vcn = ref vcnstart in
+ let vcnsize = ref vcnsize in
+ while !vcnsize > ~^0 && !data_size > ~^0 do
+ let size = min blocksize !data_size in
+ let data = dev#read (!lcn *^ blocksize) size in
+ f (Some !lcn) !vcn data;
+ lcn := !lcn +^ ~^1;
+ vcn := !vcn +^ ~^1;
+ vcnsize := !vcnsize -^ ~^1;
+ data_size := !data_size -^ size
+ done;
+ loop !data_size rest
+
+ (* Sparse hole. *)
+ | ((vcnstart, vcnsize), None) :: rest ->
+ let data_size = ref data_size in
+ let vcn = ref vcnstart in
+ let vcnsize = ref vcnsize in
+ while !vcnsize > ~^0 && !data_size > ~^0 do
+ let size = min blocksize !data_size in
+ let data = String.make size '\000' in
+ f None !vcn data;
+ vcn := !vcn +^ ~^1;
+ vcnsize := !vcnsize -^ ~^1;
+ data_size := !data_size -^ size
+ done;
+ loop !data_size rest
+ in
+ loop data_size runlist
+
+(* This is a bit limited at the moment because it can only read from
+ * a contiguous part of the file. System files are usually contiguous
+ * so this is OK for us.
+ *)
+and read_file { ntfs_blocksize = blocksize; ntfs_dev = dev }
+ { ntfs_data = data } offset size =
+ match data with
+ | None -> raise Not_found (* No $Data attribute. *)
+ | Some { ntfs_data_size = data_size; ntfs_runlist = runlist } ->
+ if offset < ~^0 || size < ~^0 || offset +^ size >= data_size then
+ invalid_arg "ntfs: read_file: tried to read outside file";
+
+ (* Get the first and last VCNs containing the data. *)
+ let vcn = offset /^ blocksize in
+ let vcnoffset = offset %^ blocksize in
+ let vcnend = (offset +^ size -^ ~^1) /^ blocksize in
+
+ (* Find the run containing this VCN. *)
+ let rec find = function
+ | [] -> raise Not_found
+ | ((vcnstart, vcnsize), lcn) :: _
+ when vcnstart <= vcn && vcn < vcnstart +^ vcnsize &&
+ vcnstart <= vcnend && vcnend < vcnstart +^ vcnsize ->
+ lcn
+ | _ :: rest -> find rest
+ in
+ let lcn = find runlist in
+
+ (* Read the LCNs. *)
+ let data =
+ match lcn with
+ | Some lcn -> dev#read (lcn *^ blocksize +^ vcnoffset) size
+ | None -> String.make size '\000' (* sparse hole *) in
+ data
+
+(* This is easy: just look at the bitmap. *)
+and offset_is_free fs offset =
+ try
+ let ntfs = get_private_data fs in
+ let blocksize = ntfs.ntfs_blocksize in
+
+ (* Get the $Bitmap file. *)
+ let file = find_system_file ntfs "$Bitmap" in
+
+ let lcn = offset /^ blocksize in
+
+ (* Read the byte in the bitmap corresponding to this LCN. *)
+ let byteoffset = lcn >^> 3 and bitoffset = lcn &^ ~^7 in
+ let byte = read_file ntfs file byteoffset ~^1 in
+ let byte = Char.code byte.[0] in
+ let bit = byte >^> (~^0x80 >^> (Int63.to_int bitoffset)) in
+
+ bit <> ~^0
+ with
+ Not_found -> false (* play it safe *)
and callbacks =
let i = ref 0 in