X-Git-Url: http://git.annexia.org/?a=blobdiff_plain;f=src%2Fkallsyms.ml;fp=src%2Fkallsyms.ml;h=8663842edd4c6c5d3042f22f6d895f318d5654c1;hb=5b2d80650c4f01c64452b1aee2f024b25dd22e3f;hp=0000000000000000000000000000000000000000;hpb=3b56c80718ca0eb1dbde633b569f5ca7313cb4be;p=virt-dmesg.git diff --git a/src/kallsyms.ml b/src/kallsyms.ml new file mode 100644 index 0000000..8663842 --- /dev/null +++ b/src/kallsyms.ml @@ -0,0 +1,253 @@ +(* virt-dmesg + * (C) Copyright 2008-2011 Red Hat Inc. + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. + *) + +open Printf + +open Utils + +(* This code tries to find the /proc/kallsyms table. This is in an + * odd compressed format (but not a very successful compression + * format). However if it exists we know that it will contain + * addresses of the ordinary ksyms, and it has some characteristics + * which make it easy to detect in the memory. + * + * kallsyms contains a complete list of symbols so is much more useful + * than the basic list of exports. + *) + +let min_kallsyms_tabsize = 1_000L +let max_kallsyms_tabsize = 1_000_000L (* 433056 kallsyms in 64 bit F14 kernel *) + +type kallsyms_compr = + | Compressed of (string * int64) list * int64 + | Uncompressed of (string * int64) list + +let search_kallsyms k map = + let ksym_addrs = filter_map ( + fun ksym -> try Some (StringMap.find ksym map) with Not_found -> None + ) Ksyms.common_ksyms in + + (* Search for those kernel addresses in the image. We're looking + * for the table kallsyms_addresses followed by kallsyms_num_syms + * (number of symbols in the table). + *) + let ksym_addrs = + List.concat (List.map (Kernel.find_all_pointers k) ksym_addrs) in + + (* Test each one to see if it's a candidate list of kernel + * addresses followed by length of list. + *) + let kallsymtabs = filter_map ( + fun addr -> + (* Search upwards from address until we find the length field. + * If found, jump backwards by length and check all addresses. + *) + debug "testing candidate kallsyms at %Lx" addr; + + (* Addresses which can appear in kallsyms can be validly not + * mapped. This appears to only happen for 64 bit kernels. + *) + let is_kallsyms_valid_address = + match k.Kernel.wordsize with + | Kernel.Word32 -> Kernel.is_mapped k + | Kernel.Word64 -> + fun addr -> + Kernel.is_mapped k addr + || Kernel.addr_compare addr 0xffffffff_ff000000_L >= 0 + || Kernel.addr_compare addr 0x00000000_00020000_L <= 0 + in + + let rec loop prev_addrp addr = + let addrp = Kernel.follow_pointer k addr in + + (* kallsyms are sorted, so this gives us an additional heuristic *) + let increasing = + match prev_addrp with + | None -> true + | Some prev_addrp -> Kernel.addr_compare prev_addrp addrp <= 0 in + + if increasing && is_kallsyms_valid_address addrp then + (* continue up the table *) + loop (Some addrp) (Kernel.succ_word k addr) + else + if addrp >= min_kallsyms_tabsize && + addrp <= max_kallsyms_tabsize then ( + (* addrp might be the symbol count. Count backwards and + * check the full table. + *) + debug "addrp (num_entries) = %Lx" addrp; + + let num_entries = Int64.to_int addrp in + let entry_size = Kernel.bytes_of_wordsize k in + let start_addr = + addr -^ Int64.of_int (entry_size * num_entries) in + let end_addr = addr in + let rec loop2 addr = + if Kernel.addr_compare addr end_addr < 0 then ( + let addrp = Kernel.follow_pointer k addr in + if is_kallsyms_valid_address addrp then + loop2 (Kernel.succ_word k addr) + else ( + debug "rejected on second pass because addrp = %Lx" addrp; + None + ) + ) else + (* ok! *) + let names_addr = Kernel.succ_word k end_addr in + debug "candidate kallsyms found at %Lx (names_addr at %Lx, num_entries %d)" + start_addr names_addr num_entries; + Some (start_addr, num_entries, names_addr) + in + loop2 start_addr + ) + else ( + debug "rejected on first pass because addrp = %Lx" addrp; + None + ) + in + match loop None addr with + | None -> None + | Some (start_addr, num_entries, names_addr) -> + (* As an additional verification, check the list of + * kallsyms_names. + *) + try + (* If the first byte is '\000' and is followed by a + * C identifier, then this is old-school list of + * symbols with prefix compression as in 2.6.9. + * Otherwise Huffman-compressed kallsyms as in + * 2.6.25. + *) + if Kernel.get_byte k names_addr = 0 && + Kernel.is_C_identifier k (names_addr+^1L) then ( + let names = ref [] in + let prev = ref "" in + let rec loop names_addr start_addr num = + if num > 0 then ( + let prefix = Kernel.get_byte k names_addr in + let prefix = String.sub !prev 0 prefix in + let name = + Kernel.get_string k (names_addr+^1L) in + let len = String.length name in + let name = prefix ^ name in + prev := name; + let names_addr = names_addr +^ Int64.of_int len +^ 2L in + let sym_value = Kernel.follow_pointer k start_addr in + let start_addr = Kernel.succ_word k start_addr in + (*eprintf "%S -> %Lx\n" name sym_value;*) + names := (name, sym_value) :: !names; + loop names_addr start_addr (num-1) + ) + in + loop names_addr start_addr num_entries; + let names = List.rev !names in + + Some (start_addr, num_entries, names_addr, + Uncompressed names) + ) + else ( (* new-style "compressed" names. *) + let compressed_names = ref [] in + let rec loop names_addr start_addr num = + if num > 0 then ( + let len = Kernel.get_byte k names_addr in + let name = Kernel.get_memory k (names_addr+^1L) len in + let names_addr = names_addr +^ Int64.of_int len +^ 1L in + let sym_value = Kernel.follow_pointer k start_addr in + let start_addr = Kernel.succ_word k start_addr in + compressed_names := + (name, sym_value) :: !compressed_names; + loop names_addr start_addr (num-1) + ) else + names_addr + in + let markers_addr = loop names_addr start_addr num_entries in + let markers_addr = Kernel.succ_align k markers_addr in + let compressed_names = List.rev !compressed_names in + + Some (start_addr, num_entries, names_addr, + Compressed (compressed_names, markers_addr)) + ) + with + Invalid_argument _ -> None (* bad names list *) + ) ksym_addrs in + + debug "candidate kallsyms at:"; + List.iter ( + function + | (start_addr, num_entries, names_addr, Uncompressed _) -> + debug "\t%Lx %d entries names_addr=%Lx old-style" + start_addr num_entries names_addr + | (start_addr, num_entries, names_addr, + Compressed (_, markers_addr)) -> + debug "\t%Lx %d entries names_addr=%Lx markers_addr=%Lx" + start_addr num_entries names_addr markers_addr + ) kallsymtabs; + + (* Vote for the most popular symbol table candidate and + * return the list of kallsyms. + *) + let freqs = frequency kallsymtabs in + match freqs with + | [] -> + (* Can't find any kallsymtabs. *) + raise Not_found + + | (_, (_, _, _, Uncompressed names)) :: _ -> + names + + | (_, (start_addr, num_entries, names_addr, + Compressed (compressed_names, markers_addr))) :: _ -> + (* Skip the markers and look for the token table. *) + let num_markers = Int64.of_int ((num_entries + 255) / 256) in + let marker_size = Int64.of_int (Kernel.bytes_of_wordsize k) in + let tokens_addr = markers_addr +^ marker_size *^ num_markers in + + (* Now read out the compression tokens, which are just + * 256 ASCIIZ strings that map bytes in the compression + * names to substrings. + *) + let tokens = Array.make 256 "" in + let rec loop i addr = + if i < 256 then ( + let str = Kernel.get_string k addr in + let len = String.length str in + let addr = addr +^ Int64.of_int (len+1) in + tokens.(i) <- str; + loop (i+1) addr + ) + in + loop 0 tokens_addr; + + (* Expand the compressed names using the tokens. *) + filter_map ( + fun (name, sym_value) -> + let f c = tokens.(Char.code c) in + let name = replace_chars f name in + (* First character in uncompressed output is the symbol + * type, eg. 'T'/'t' for text etc. + *) + (* NOTE: Symbol names are NOT unique + * (eg. 'con_start' is both a function and data in + * some kernels). XXX We need to handle this situation + * better. + *) + (*let typ = name.[0] in*) + let name = String.sub name 1 (String.length name - 1) in + (*eprintf "%S -> %Lx\n" name sym_value;*) + Some (name, sym_value) + ) compressed_names