From f579ab7314ada4d49163ebeb58861c04194dc2d4 Mon Sep 17 00:00:00 2001 From: Earl Ou Date: Fri, 12 Oct 2012 14:02:49 +0800 Subject: Exiftool parser This parser parse the output from Phil Harvey's 'exiftool' with -v2 flag and convert it input xml format Change-Id: Iffdb235780697f8c37738937fd4ecaeb1d1127bb --- tests/exiftool_parser/parser.py | 66 +++++++++++++++++++++++++++++++++++++++++ 1 file changed, 66 insertions(+) create mode 100755 tests/exiftool_parser/parser.py (limited to 'tests/exiftool_parser/parser.py') diff --git a/tests/exiftool_parser/parser.py b/tests/exiftool_parser/parser.py new file mode 100755 index 000000000..32984886c --- /dev/null +++ b/tests/exiftool_parser/parser.py @@ -0,0 +1,66 @@ +#!/usr/bin/env python +# +# This parser parses the output from Phil Harvey's exiftool (version 9.02) +# and convert it to xml format. It reads exiftool's output from stdin and +# write the xml format to stdout. +# +# In order to get the raw infomation from exiftool, we need to enable the verbose +# flag (-v2) of exiftool. +# +# Usage: +# exiftool -v2 img.jpg | ./parser.py >> output.xml +# +# + +import os +import sys +import re + +text = sys.stdin.read() + +print """""" +print "" + +# find the following two groups of string: +# +# 1. tag: +# +# x) name = value +# - Tag 0x1234 +# +# 2. IFD indicator: +# +# + [xxx directory with xx entries] +# +p = re.compile( + "(^.*?[0-9]\).*? = .*?\n.*?- Tag 0x[0-9a-f]{4})|(\+ \[.*? directory with [0-9]+ entries]$)" + , re.M) +tags = p.findall(text) + +for s in tags: + if s[1]: + ifd = s[1][3:].split()[0] + else: + s = s[0] + # find the raw value in the parenthesis + p = re.compile("\(.*\)\n") + value = p.search(s) + if value: + value = value.group(0)[1:-2] + else: + p = re.compile("=.*\n") + value = p.search(s) + value = value.group(0)[2:-1] + + # find the ID + p = re.compile("0x[0-9a-f]{4}") + _id = p.search(s) + _id = _id.group(0) + + # find the name + p = re.compile("[0-9]*?\).*? = ") + name = p.search(s) + name = name.group(0)[4:-3] + print (' ' + value + "") +print "" -- cgit v1.2.3