package tag import ( "crypto/sha1" "encoding/binary" "fmt" "hash" "io" "os" ) // Sum creates a checksum of the audio file data provided by the io.ReadSeeker which is metadata // (ID3, MP4) invariant. func Sum(r io.ReadSeeker) (string, error) { b, err := readBytes(r, 11) if err != nil { return "", err } _, err = r.Seek(-11, os.SEEK_CUR) if err != nil { return "", fmt.Errorf("could not seek back to original position: %v", err) } if string(b[4:11]) == "ftypM4A" { return SumAtoms(r) } if string(b[0:3]) == "ID3" { return SumID3v2(r) } h, err := SumID3v1(r) if err != nil { if err == ErrNotID3v1 { return SumAll(r) } return "", err } return h, nil } // SumAll returns a checksum of the content from the reader (until EOF). func SumAll(r io.ReadSeeker) (string, error) { h := sha1.New() _, err := io.Copy(h, r) if err != nil { return "", nil } return hashSum(h), nil } // SumAtoms constructs a checksum of MP4 audio file data provided by the io.ReadSeeker which is // metadata invariant. func SumAtoms(r io.ReadSeeker) (string, error) { for { var size uint32 err := binary.Read(r, binary.BigEndian, &size) if err != nil { if err == io.EOF { return "", fmt.Errorf("reached EOF before audio data") } return "", err } name, err := readString(r, 4) if err != nil { return "", err } switch name { case "meta": // next_item_id (int32) _, err := r.Seek(4, os.SEEK_CUR) if err != nil { return "", err } fallthrough case "moov", "udta", "ilst": return SumAtoms(r) case "mdat": // stop when we get to the data h := sha1.New() _, err := io.CopyN(h, r, int64(size-8)) if err != nil { return "", fmt.Errorf("error reading audio data: %v", err) } return hashSum(h), nil } _, err = r.Seek(int64(size-8), os.SEEK_CUR) if err != nil { return "", fmt.Errorf("error reading '%v' tag: %v", name, err) } } } // SumID3v1 constructs a checksum of MP3 audio file data (assumed to have ID3v1 tags) provided // by the io.ReadSeeker which is metadata invariant. func SumID3v1(r io.ReadSeeker) (string, error) { // Need to stop before we hit potential ID3v1 data. n, err := r.Seek(-128, os.SEEK_END) if err != nil { return "", fmt.Errorf("error seeking to the end of the file (minus ID3v1 header): %v", err) } // TODO: improve this check??? if n <= 0 { return "", fmt.Errorf("file size must be greater than 128 bytes (ID3v1 header size) for MP3") } // Seek back to the original position now! _, err = r.Seek(-1*n, os.SEEK_SET) if err != nil { return "", fmt.Errorf("error seeking back to the start of the data: %v", err) } h := sha1.New() _, err = io.CopyN(h, r, n) if err != nil { return "", fmt.Errorf("error reading %v bytes: %v", n, err) } return hashSum(h), nil } // SumID3v2 constructs a checksum of MP3 audio file data (assumed to have ID3v2 tags) provided by the // io.ReadSeeker which is metadata invariant. func SumID3v2(r io.ReadSeeker) (string, error) { header, err := readID3v2Header(r) if err != nil { return "", fmt.Errorf("error reading ID3v2 header: %v", err) } _, err = r.Seek(int64(header.Size)+10, os.SEEK_SET) if err != nil { return "", fmt.Errorf("error seeking to end of ID3V2 header: %v", err) } // Need to stop before we hit potential ID3v1 data. n, err := r.Seek(-128, os.SEEK_END) if err != nil { return "", fmt.Errorf("error seeking to the end of the file (minus ID3v1 header): %v", err) } // TODO: remove this check????? if n < 0 { return "", fmt.Errorf("file size must be greater than 128 bytes for MP3: %v bytes", n) } // Seek back to the original position now! _, err = r.Seek(-1*n, os.SEEK_SET) if err != nil { return "", fmt.Errorf("error seeking back to the start of the data: %v", err) } h := sha1.New() _, err = io.CopyN(h, r, n) if err != nil { return "", fmt.Errorf("error reading %v bytes: %v", n, err) } return hashSum(h), nil } func hashSum(h hash.Hash) string { return fmt.Sprintf("%x", h.Sum([]byte{})) }