/* Copyright 2011 Google Inc. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. nYou may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ // Package magic implements MIME type sniffing of data based on the // well-known "magic" number prefixes in the file. package magic import ( "bytes" "io" "net/http" "strings" ) type prefixEntry struct { prefix []byte mtype string } var prefixTable = []prefixEntry{ {[]byte("GIF87a"), "image/gif"}, {[]byte("GIF89a"), "image/gif"}, // TODO: Others? {[]byte("\xff\xd8\xff\xe2"), "image/jpeg"}, {[]byte("\xff\xd8\xff\xe1"), "image/jpeg"}, {[]byte("\xff\xd8\xff\xe0"), "image/jpeg"}, {[]byte("\xff\xd8\xff\xdb"), "image/jpeg"}, {[]byte("\x49\x49\x2a\x00\x10\x00\x00\x00\x43\x52\x02"), "image/cr2"}, {[]byte{137, 'P', 'N', 'G', '\r', '\n', 26, 10}, "image/png"}, {[]byte("-----BEGIN PGP PUBLIC KEY BLOCK---"), "text/x-openpgp-public-key"}, {[]byte{'I', 'D', '3'}, "audio/mpeg"}, // TODO(bradfitz): popular audio & video formats at least } // MIMEType returns the MIME type from the data in the provided header // of the data. // It returns the empty string if the MIME type can't be determined. func MIMEType(hdr []byte) string { hlen := len(hdr) for _, pte := range prefixTable { plen := len(pte.prefix) if hlen > plen && bytes.Equal(hdr[:plen], pte.prefix) { return pte.mtype } } t := http.DetectContentType(hdr) t = strings.Replace(t, "; charset=utf-8", "", 1) if t != "application/octet-stream" && t != "text/plain" { return t } return "" } // MIMETypeFromReader takes a reader, sniffs the beginning of it, // and returns the mime (if sniffed, else "") and a new reader // that's the concatenation of the bytes sniffed and the remaining // reader. func MIMETypeFromReader(r io.Reader) (mime string, reader io.Reader) { var buf bytes.Buffer io.CopyN(&buf, r, 1024) mime = MIMEType(buf.Bytes()) return mime, io.MultiReader(&buf, r) } // MIMETypeFromReader takes a ReaderAt, sniffs the beginning of it, // and returns the MIME type if sniffed, else the empty string. func MIMETypeFromReaderAt(ra io.ReaderAt) (mime string) { var buf [1024]byte n, _ := ra.ReadAt(buf[:], 0) return MIMEType(buf[:n]) }