package exif import ( "bytes" "fmt" "strings" "encoding/binary" "github.com/dsoprea/go-logging" ) var ( ifdEnumerateLogger = log.NewLogger("exifjpeg.ifd") ) // IfdTagEnumerator knows how to decode an IFD and all of the tags it // describes. // // The IFDs and the actual values can float throughout the EXIF block, but the // IFD itself is just a minor header followed by a set of repeating, // statically-sized records. So, the tags (though notnecessarily their values) // are fairly simple to enumerate. type IfdTagEnumerator struct { byteOrder binary.ByteOrder addressableData []byte ifdOffset uint32 buffer *bytes.Buffer } func NewIfdTagEnumerator(addressableData []byte, byteOrder binary.ByteOrder, ifdOffset uint32) (ite *IfdTagEnumerator) { ite = &IfdTagEnumerator{ addressableData: addressableData, byteOrder: byteOrder, buffer: bytes.NewBuffer(addressableData[ifdOffset:]), } return ite } // getUint16 reads a uint16 and advances both our current and our current // accumulator (which allows us to know how far to seek to the beginning of the // next IFD when it's time to jump). func (ife *IfdTagEnumerator) getUint16() (value uint16, raw []byte, err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() raw = make([]byte, 2) _, err = ife.buffer.Read(raw) log.PanicIf(err) if ife.byteOrder == binary.BigEndian { value = binary.BigEndian.Uint16(raw) } else { value = binary.LittleEndian.Uint16(raw) } return value, raw, nil } // getUint32 reads a uint32 and advances both our current and our current // accumulator (which allows us to know how far to seek to the beginning of the // next IFD when it's time to jump). func (ife *IfdTagEnumerator) getUint32() (value uint32, raw []byte, err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() raw = make([]byte, 4) _, err = ife.buffer.Read(raw) log.PanicIf(err) if ife.byteOrder == binary.BigEndian { value = binary.BigEndian.Uint32(raw) } else { value = binary.LittleEndian.Uint32(raw) } return value, raw, nil } type IfdEnumerate struct { exifData []byte buffer *bytes.Buffer byteOrder binary.ByteOrder currentOffset uint32 } func NewIfdEnumerate(exifData []byte, byteOrder binary.ByteOrder) *IfdEnumerate { // Make it obvious what data we expect and when we don't get it. if IsExif(exifData) == false { log.Panicf("not exif data") } return &IfdEnumerate{ exifData: exifData, buffer: bytes.NewBuffer(exifData), byteOrder: byteOrder, } } // ValueContext describes all of the parameters required to find and extract // the actual tag value. type ValueContext struct { UnitCount uint32 ValueOffset uint32 RawValueOffset []byte AddressableData []byte } func (ie *IfdEnumerate) getTagEnumerator(ifdOffset uint32) (ite *IfdTagEnumerator) { ite = NewIfdTagEnumerator( ie.exifData[ExifAddressableAreaStart:], ie.byteOrder, ifdOffset) return ite } func (ie *IfdEnumerate) parseTag(ii IfdIdentity, tagIndex int, ite *IfdTagEnumerator) (tag *IfdTagEntry, err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() tagId, _, err := ite.getUint16() log.PanicIf(err) tagType, _, err := ite.getUint16() log.PanicIf(err) unitCount, _, err := ite.getUint32() log.PanicIf(err) valueOffset, rawValueOffset, err := ite.getUint32() log.PanicIf(err) tag = &IfdTagEntry{ Ii: ii, TagId: tagId, TagIndex: tagIndex, TagType: tagType, UnitCount: unitCount, ValueOffset: valueOffset, RawValueOffset: rawValueOffset, } // If it's an IFD but not a standard one, it'll just be seen as a LONG // (the standard IFD tag type), later, unless we skip it because it's // [likely] not even in the standard list of known tags. childIfdName, isIfd := IfdTagNameWithId(ii.IfdName, tagId) if isIfd == true { tag.ChildIfdName = childIfdName } return tag, nil } // TagVisitor is an optional callback that can get hit for every tag we parse // through. `addressableData` is the byte array startign after the EXIF header // (where the offsets of all IFDs and values are calculated from). type TagVisitor func(ii IfdIdentity, ifdIndex int, tagId uint16, tagType TagType, valueContext ValueContext) (err error) // ParseIfd decodes the IFD block that we're currently sitting on the first // byte of. func (ie *IfdEnumerate) ParseIfd(ii IfdIdentity, ifdIndex int, ite *IfdTagEnumerator, visitor TagVisitor, doDescend bool) (nextIfdOffset uint32, entries []*IfdTagEntry, err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() tagCount, _, err := ite.getUint16() log.PanicIf(err) ifdEnumerateLogger.Debugf(nil, "Current IFD tag-count: (%d)", tagCount) entries = make([]*IfdTagEntry, tagCount) for i := 0; i < int(tagCount); i++ { tag, err := ie.parseTag(ii, i, ite) log.PanicIf(err) if visitor != nil { tt := NewTagType(tag.TagType, ie.byteOrder) vc := ValueContext{ UnitCount: tag.UnitCount, ValueOffset: tag.ValueOffset, RawValueOffset: tag.RawValueOffset, AddressableData: ie.exifData[ExifAddressableAreaStart:], } err := visitor(ii, ifdIndex, tag.TagId, tt, vc) log.PanicIf(err) } // If it's an IFD but not a standard one, it'll just be seen as a LONG // (the standard IFD tag type), later, unless we skip it because it's // [likely] not even in the standard list of known tags. if tag.ChildIfdName != "" && doDescend == true { ifdEnumerateLogger.Debugf(nil, "Descending to IFD [%s].", tag.ChildIfdName) childIi, _ := IfdIdOrFail(ii.IfdName, tag.ChildIfdName) err := ie.scan(childIi, tag.ValueOffset, visitor) log.PanicIf(err) } entries[i] = tag } nextIfdOffset, _, err = ite.getUint32() log.PanicIf(err) ifdEnumerateLogger.Debugf(nil, "Next IFD at offset: (%08x)", nextIfdOffset) return nextIfdOffset, entries, nil } // Scan enumerates the different EXIF blocks (called IFDs). func (ie *IfdEnumerate) scan(ii IfdIdentity, ifdOffset uint32, visitor TagVisitor) (err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() for ifdIndex := 0;; ifdIndex++ { ifdEnumerateLogger.Debugf(nil, "Parsing IFD [%s] (%d) at offset (%04x).", ii.IfdName, ifdIndex, ifdOffset) ite := ie.getTagEnumerator(ifdOffset) nextIfdOffset, _, err := ie.ParseIfd(ii, ifdIndex, ite, visitor, true) log.PanicIf(err) if nextIfdOffset == 0 { break } ifdOffset = nextIfdOffset } return nil } // Scan enumerates the different EXIF blocks (called IFDs). func (ie *IfdEnumerate) Scan(ifdOffset uint32, visitor TagVisitor) (err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() ii, _ := IfdIdOrFail("", IfdStandard) err = ie.scan(ii, ifdOffset, visitor) log.PanicIf(err) return nil } type Ifd struct { ByteOrder binary.ByteOrder Id int ParentIfd *Ifd Name string Index int Offset uint32 Entries []*IfdTagEntry EntriesByTagId map[uint16][]*IfdTagEntry Children []*Ifd NextIfdOffset uint32 NextIfd *Ifd } // FindTagWithId returns a list of tags (usually just zero or one) that match // the given tag ID. This is efficient. func (ifd Ifd) FindTagWithId(tagId uint16) (results []*IfdTagEntry, err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() results, found := ifd.EntriesByTagId[tagId] if found != true { log.Panic(ErrTagNotFound) } return results, nil } // FindTagWithName returns a list of tags (usually just zero or one) that match // the given tag name. This is not efficient (though the labor is trivial). func (ifd Ifd) FindTagWithName(tagName string) (results []*IfdTagEntry, err error) { defer func() { if state := recover(); state != nil { err = log.Wrap(state.(error)) } }() ti := NewTagIndex() ii := ifd.Identity() it, err := ti.GetWithName(ii, tagName) if log.Is(err, ErrTagNotFound) == true { log.Panic(ErrTagNotStandard) } else if err != nil { log.Panic(err) } results = make([]*IfdTagEntry, 0) for _, ite := range ifd.Entries { if ite.TagId == it.Id { results = append(results, ite) } } if len(results) == 0 { log.Panic(ErrTagNotFound) } return results, nil } func (ifd Ifd) String() string { parentOffset := uint32(0) if ifd.ParentIfd != nil { parentOffset = ifd.ParentIfd.Offset } return fmt.Sprintf("IFD