MimeUtils.java

  1/*
  2 * Copyright (C) 2010 The Android Open Source Project
  3 *
  4 * Licensed under the Apache License, Version 2.0 (the "License");
  5 * you may not use this file except in compliance with the License.
  6 * You may obtain a copy of the License at
  7 *
  8 *      http://www.apache.org/licenses/LICENSE-2.0
  9 *
 10 * Unless required by applicable law or agreed to in writing, software
 11 * distributed under the License is distributed on an "AS IS" BASIS,
 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 13 * See the License for the specific language governing permissions and
 14 * limitations under the License.
 15 */
 16package eu.siacs.conversations.utils;
 17
import android.content.Context;
import android.net.Uri;
import android.util.Log;

import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.net.URL;
import java.util.HashMap;
import java.util.Locale;
import java.util.Map;
import java.util.Properties;

import eu.siacs.conversations.Config;
import eu.siacs.conversations.entities.Transferable;
import eu.siacs.conversations.services.ExportBackupService;
 34
 35/**
 36 * Utilities for dealing with MIME types.
 37 * Used to implement java.net.URLConnection and android.webkit.MimeTypeMap.
 38 */
 39public final class MimeUtils {
 40    private static final Map<String, String> mimeTypeToExtensionMap = new HashMap<>();
 41    private static final Map<String, String> extensionToMimeTypeMap = new HashMap<>();
 42
 43    static {
 44        // The following table is based on /etc/mime.types data minus
 45        // chemical/* MIME types and MIME types that don't map to any
 46        // file extensions. We also exclude top-level domain names to
 47        // deal with cases like:
 48        //
 49        // mail.google.com/a/google.com
 50        //
 51        // and "active" MIME types (due to potential security issues).
 52        // Note that this list is _not_ in alphabetical order and must not be sorted.
 53        // The "most popular" extension must come first, so that it's the one returned
 54        // by guessExtensionFromMimeType.
 55        add("application/andrew-inset", "ez");
 56        add("application/dsptype", "tsp");
 57        add("application/epub+zip", "epub");
 58        add("application/gpx+xml", "gpx");
 59        add("application/hta", "hta");
 60        add("application/mac-binhex40", "hqx");
 61        add("application/mathematica", "nb");
 62        add("application/msaccess", "mdb");
 63        add("application/oda", "oda");
 64        add("application/ogg", "ogg");
 65        add("application/pdf", "pdf");
 66        add("application/pgp-keys", "key");
 67        add("application/pgp-signature", "pgp");
 68        add("application/pics-rules", "prf");
 69        add("application/pkix-cert", "cer");
 70        add("application/rar", "rar");
 71        add("application/rdf+xml", "rdf");
 72        add("application/rss+xml", "rss");
 73        add("application/zip", "zip");
 74        add("application/vnd.amazon.mobi8-ebook", "azw3");
 75        add("application/vnd.amazon.mobi8-ebook", "azw");
 76        add("application/vnd.amazon.mobi8-ebook", "kfx");
 77        add("application/vnd.android.package-archive", "apk");
 78        add("application/vnd.cinderella", "cdy");
 79        add(ExportBackupService.MIME_TYPE, "ceb");
 80        add("application/vnd.ms-pki.stl", "stl");
 81        add("application/vnd.oasis.opendocument.database", "odb");
 82        add("application/vnd.oasis.opendocument.formula", "odf");
 83        add("application/vnd.oasis.opendocument.graphics", "odg");
 84        add("application/vnd.oasis.opendocument.graphics-template", "otg");
 85        add("application/vnd.oasis.opendocument.image", "odi");
 86        add("application/vnd.oasis.opendocument.spreadsheet", "ods");
 87        add("application/vnd.oasis.opendocument.spreadsheet-template", "ots");
 88        add("application/vnd.oasis.opendocument.text", "odt");
 89        add("application/vnd.oasis.opendocument.text-master", "odm");
 90        add("application/vnd.oasis.opendocument.text-template", "ott");
 91        add("application/vnd.oasis.opendocument.text-web", "oth");
 92        add("application/vnd.google-earth.kml+xml", "kml");
 93        add("application/vnd.google-earth.kmz", "kmz");
 94        add("application/msword", "doc");
 95        add("application/msword", "dot");
 96        add("application/vnd.openxmlformats-officedocument.wordprocessingml.document", "docx");
 97        add("application/vnd.openxmlformats-officedocument.wordprocessingml.template", "dotx");
 98        add("application/vnd.ms-excel", "xls");
 99        add("application/vnd.ms-excel", "xlt");
100        add("application/vnd.openxmlformats-officedocument.spreadsheetml.sheet", "xlsx");
101        add("application/vnd.openxmlformats-officedocument.spreadsheetml.template", "xltx");
102        add("application/vnd.ms-powerpoint", "ppt");
103        add("application/vnd.ms-powerpoint", "pot");
104        add("application/vnd.ms-powerpoint", "pps");
105        add("application/vnd.openxmlformats-officedocument.presentationml.presentation", "pptx");
106        add("application/vnd.openxmlformats-officedocument.presentationml.template", "potx");
107        add("application/vnd.openxmlformats-officedocument.presentationml.slideshow", "ppsx");
108        add("application/vnd.rim.cod", "cod");
109        add("application/vnd.smaf", "mmf");
110        add("application/vnd.stardivision.calc", "sdc");
111        add("application/vnd.stardivision.draw", "sda");
112        add("application/vnd.stardivision.impress", "sdd");
113        add("application/vnd.stardivision.impress", "sdp");
114        add("application/vnd.stardivision.math", "smf");
115        add("application/vnd.stardivision.writer", "sdw");
116        add("application/vnd.stardivision.writer", "vor");
117        add("application/vnd.stardivision.writer-global", "sgl");
118        add("application/vnd.sun.xml.calc", "sxc");
119        add("application/vnd.sun.xml.calc.template", "stc");
120        add("application/vnd.sun.xml.draw", "sxd");
121        add("application/vnd.sun.xml.draw.template", "std");
122        add("application/vnd.sun.xml.impress", "sxi");
123        add("application/vnd.sun.xml.impress.template", "sti");
124        add("application/vnd.sun.xml.math", "sxm");
125        add("application/vnd.sun.xml.writer", "sxw");
126        add("application/vnd.sun.xml.writer.global", "sxg");
127        add("application/vnd.sun.xml.writer.template", "stw");
128        add("application/vnd.visio", "vsd");
129        add("application/x-abiword", "abw");
130        add("application/x-apple-diskimage", "dmg");
131        add("application/x-bcpio", "bcpio");
132        add("application/x-bittorrent", "torrent");
133        add("application/x-cdf", "cdf");
134        add("application/x-cdlink", "vcd");
135        add("application/x-chess-pgn", "pgn");
136        add("application/x-cpio", "cpio");
137        add("application/x-debian-package", "deb");
138        add("application/x-debian-package", "udeb");
139        add("application/x-director", "dcr");
140        add("application/x-director", "dir");
141        add("application/x-director", "dxr");
142        add("application/x-dms", "dms");
143        add("application/x-doom", "wad");
144        add("application/x-dvi", "dvi");
145        add("application/x-font", "pfa");
146        add("application/x-font", "pfb");
147        add("application/x-font", "gsf");
148        add("application/x-font", "pcf");
149        add("application/x-font", "pcf.Z");
150        add("application/x-freemind", "mm");
151        // application/futuresplash isn't IANA, so application/x-futuresplash should come first.
152        add("application/x-futuresplash", "spl");
153        add("application/futuresplash", "spl");
154        add("application/x-gnumeric", "gnumeric");
155        add("application/x-go-sgf", "sgf");
156        add("application/x-graphing-calculator", "gcf");
157        add("application/x-gtar", "tgz");
158        add("application/x-gtar", "gtar");
159        add("application/x-gtar", "taz");
160        add("application/x-hdf", "hdf");
161        add("application/x-ica", "ica");
162        add("application/x-internet-signup", "ins");
163        add("application/x-internet-signup", "isp");
164        add("application/x-iphone", "iii");
165        add("application/x-iso9660-image", "iso");
166        add("application/x-jmol", "jmz");
167        add("application/x-kchart", "chrt");
168        add("application/x-killustrator", "kil");
169        add("application/x-koan", "skp");
170        add("application/x-koan", "skd");
171        add("application/x-koan", "skt");
172        add("application/x-koan", "skm");
173        add("application/x-kpresenter", "kpr");
174        add("application/x-kpresenter", "kpt");
175        add("application/x-kspread", "ksp");
176        add("application/x-kword", "kwd");
177        add("application/x-kword", "kwt");
178        add("application/x-latex", "latex");
179        add("application/x-lha", "lha");
180        add("application/x-lzh", "lzh");
181        add("application/x-lzx", "lzx");
182        add("application/x-maker", "frm");
183        add("application/x-maker", "maker");
184        add("application/x-maker", "frame");
185        add("application/x-maker", "fb");
186        add("application/x-maker", "book");
187        add("application/x-maker", "fbdoc");
188        add("application/x-mif", "mif");
189        add("application/x-mobipocket-ebook", "mobi");
190        add("application/x-ms-wmd", "wmd");
191        add("application/x-ms-wmz", "wmz");
192        add("application/x-msi", "msi");
193        add("application/x-ns-proxy-autoconfig", "pac");
194        add("application/x-nwc", "nwc");
195        add("application/x-object", "o");
196        add("application/x-oz-application", "oza");
197        add("application/x-pem-file", "pem");
198        add("application/x-pkcs12", "p12");
199        add("application/x-pkcs12", "pfx");
200        add("application/x-pkcs7-certreqresp", "p7r");
201        add("application/x-pkcs7-crl", "crl");
202        add("application/x-quicktimeplayer", "qtl");
203        add("application/x-shar", "shar");
204        add("application/x-shockwave-flash", "swf");
205        add("application/x-stuffit", "sit");
206        add("application/x-sv4cpio", "sv4cpio");
207        add("application/x-sv4crc", "sv4crc");
208        add("application/x-tar", "tar");
209        add("application/x-texinfo", "texinfo");
210        add("application/x-texinfo", "texi");
211        add("application/x-troff", "t");
212        add("application/x-troff", "roff");
213        add("application/x-troff-man", "man");
214        add("application/x-ustar", "ustar");
215        add("application/x-wais-source", "src");
216        add("application/x-wingz", "wz");
217        add("application/x-webarchive", "webarchive");
218        add("application/x-webarchive-xml", "webarchivexml");
219        add("application/x-x509-ca-cert", "crt");
220        add("application/x-x509-user-cert", "crt");
221        add("application/x-x509-server-cert", "crt");
222        add("application/x-xcf", "xcf");
223        add("application/x-xfig", "fig");
224        add("application/xhtml+xml", "xhtml");
225        add("audio/3gpp", "3gpp");
226        add("audio/aac", "aac");
227        add("audio/aac-adts", "aac");
228        add("audio/amr", "amr");
229        add("audio/amr-wb", "awb");
230        add("audio/basic", "snd");
231        add("audio/flac", "flac");
232        add("application/x-flac", "flac");
233        add("audio/imelody", "imy");
234        add("audio/midi", "mid");
235        add("audio/midi", "midi");
236        add("audio/midi", "ota");
237        add("audio/midi", "kar");
238        add("audio/midi", "rtttl");
239        add("audio/midi", "xmf");
240        add("audio/mobile-xmf", "mxmf");
241        // add ".mp3" first so it will be the default for guessExtensionFromMimeType
242        add("audio/mpeg", "mp3");
243        add("audio/mpeg", "mpga");
244        add("audio/mpeg", "mpega");
245        add("audio/mpeg", "mp2");
246        add("audio/mpeg", "m4a");
247        add("audio/mpegurl", "m3u");
248        add("audio/ogg", "oga");
249        add("audio/prs.sid", "sid");
250        add("audio/x-aiff", "aif");
251        add("audio/x-aiff", "aiff");
252        add("audio/x-aiff", "aifc");
253        add("audio/x-gsm", "gsm");
254        add("audio/x-matroska", "mka");
255        add("audio/x-mpegurl", "m3u");
256        add("audio/x-ms-wma", "wma");
257        add("audio/x-ms-wax", "wax");
258        add("audio/x-pn-realaudio", "ra");
259        add("audio/x-pn-realaudio", "rm");
260        add("audio/x-pn-realaudio", "ram");
261        add("audio/x-realaudio", "ra");
262        add("audio/x-scpls", "pls");
263        add("audio/x-sd2", "sd2");
264        add("audio/x-wav", "wav");
265        // image/bmp isn't IANA, so image/x-ms-bmp should come first.
266        add("image/x-ms-bmp", "bmp");
267        add("image/bmp", "bmp");
268        add("image/gif", "gif");
269        // image/ico isn't IANA, so image/x-icon should come first.
270        add("image/x-icon", "ico");
271        add("image/ico", "cur");
272        add("image/ico", "ico");
273        add("image/ief", "ief");
274        add("image/heic", "heic");
275        // add ".jpg" first so it will be the default for guessExtensionFromMimeType
276        add("image/jpeg", "jpg");
277        add("image/jpeg", "jpeg");
278        add("image/jpeg", "jpe");
279        add("image/jpeg", "jfif");
280        add("image/jpeg", "jif");
281        add("image/pcx", "pcx");
282        add("image/png", "png");
283        add("image/svg+xml", "svg");
284        add("image/svg+xml", "svgz");
285        add("image/tiff", "tiff");
286        add("image/tiff", "tif");
287        add("image/vnd.djvu", "djvu");
288        add("image/vnd.djvu", "djv");
289        add("image/vnd.wap.wbmp", "wbmp");
290        add("image/webp", "webp");
291        add("image/x-cmu-raster", "ras");
292        add("image/x-coreldraw", "cdr");
293        add("image/x-coreldrawpattern", "pat");
294        add("image/x-coreldrawtemplate", "cdt");
295        add("image/x-corelphotopaint", "cpt");
296        add("image/x-jg", "art");
297        add("image/x-jng", "jng");
298        add("image/x-photoshop", "psd");
299        add("image/x-portable-anymap", "pnm");
300        add("image/x-portable-bitmap", "pbm");
301        add("image/x-portable-graymap", "pgm");
302        add("image/x-portable-pixmap", "ppm");
303        add("image/x-rgb", "rgb");
304        add("image/x-xbitmap", "xbm");
305        add("image/x-xpixmap", "xpm");
306        add("image/x-xwindowdump", "xwd");
307        add("model/iges", "igs");
308        add("model/iges", "iges");
309        add("model/mesh", "msh");
310        add("model/mesh", "mesh");
311        add("model/mesh", "silo");
312        add("text/calendar", "ics");
313        add("text/calendar", "icz");
314        add("text/comma-separated-values", "csv");
315        add("text/css", "css");
316        add("text/html", "htm");
317        add("text/html", "html");
318        add("text/h323", "323");
319        add("text/iuls", "uls");
320        add("text/mathml", "mml");
321        // add ".txt" first so it will be the default for guessExtensionFromMimeType
322        add("text/plain", "txt");
323        add("text/plain", "asc");
324        add("text/plain", "text");
325        add("text/plain", "diff");
326        add("text/plain", "po");     // reserve "pot" for vnd.ms-powerpoint
327        add("text/richtext", "rtx");
328        add("text/rtf", "rtf");
329        add("text/text", "phps");
330        add("text/tab-separated-values", "tsv");
331        add("text/xml", "xml");
332        add("text/x-bibtex", "bib");
333        add("text/x-boo", "boo");
334        add("text/x-c++hdr", "hpp");
335        add("text/x-c++hdr", "h++");
336        add("text/x-c++hdr", "hxx");
337        add("text/x-c++hdr", "hh");
338        add("text/x-c++src", "cpp");
339        add("text/x-c++src", "c++");
340        add("text/x-c++src", "cc");
341        add("text/x-c++src", "cxx");
342        add("text/x-chdr", "h");
343        add("text/x-component", "htc");
344        add("text/x-csh", "csh");
345        add("text/x-csrc", "c");
346        add("text/x-dsrc", "d");
347        add("text/x-haskell", "hs");
348        add("text/x-java", "java");
349        add("text/x-literate-haskell", "lhs");
350        add("text/x-moc", "moc");
351        add("text/x-pascal", "p");
352        add("text/x-pascal", "pas");
353        add("text/x-pcs-gcd", "gcd");
354        add("text/x-setext", "etx");
355        add("text/x-tcl", "tcl");
356        add("text/x-tex", "tex");
357        add("text/x-tex", "ltx");
358        add("text/x-tex", "sty");
359        add("text/x-tex", "cls");
360        add("text/x-vcalendar", "vcs");
361        add("text/x-vcard", "vcf");
362        add("video/3gpp", "3gpp");
363        add("video/3gpp", "3gp");
364        add("video/3gpp2", "3gpp2");
365        add("video/3gpp2", "3g2");
366        add("video/avi", "avi");
367        add("video/dl", "dl");
368        add("video/dv", "dif");
369        add("video/dv", "dv");
370        add("video/fli", "fli");
371        add("video/m4v", "m4v");
372        add("video/mp2ts", "ts");
373        add("video/ogg", "ogv");
374        add("video/mpeg", "mpeg");
375        add("video/mpeg", "mpg");
376        add("video/mpeg", "mpe");
377        add("video/mp4", "mp4");
378        add("video/mpeg", "VOB");
379        add("video/quicktime", "qt");
380        add("video/quicktime", "mov");
381        add("video/vnd.mpegurl", "mxu");
382        add("video/webm", "webm");
383        add("video/x-la-asf", "lsf");
384        add("video/x-la-asf", "lsx");
385        add("video/x-matroska", "mkv");
386        add("video/x-mng", "mng");
387        add("video/x-ms-asf", "asf");
388        add("video/x-ms-asf", "asx");
389        add("video/x-ms-wm", "wm");
390        add("video/x-ms-wmv", "wmv");
391        add("video/x-ms-wmx", "wmx");
392        add("video/x-ms-wvx", "wvx");
393        add("video/x-sgi-movie", "movie");
394        add("video/x-webex", "wrf");
395        add("x-conference/x-cooltalk", "ice");
396        add("x-epoc/x-sisx-app", "sisx");
397        applyOverrides();
398    }
399
400    private static void add(String mimeType, String extension) {
401        // If we have an existing x -> y mapping, we do not want to
402        // override it with another mapping x -> y2.
403        // If a mime type maps to several extensions
404        // the first extension added is considered the most popular
405        // so we do not want to overwrite it later.
406        if (!mimeTypeToExtensionMap.containsKey(mimeType)) {
407            mimeTypeToExtensionMap.put(mimeType, extension);
408        }
409        if (!extensionToMimeTypeMap.containsKey(extension)) {
410            extensionToMimeTypeMap.put(extension, mimeType);
411        }
412    }
413
414    private static InputStream getContentTypesPropertiesStream() {
415        // User override?
416        String userTable = System.getProperty("content.types.user.table");
417        if (userTable != null) {
418            File f = new File(userTable);
419            if (f.exists()) {
420                try {
421                    return new FileInputStream(f);
422                } catch (IOException ignored) {
423                }
424            }
425        }
426        // Standard location?
427        File f = new File(System.getProperty("java.home"), "lib" + File.separator + "content-types.properties");
428        if (f.exists()) {
429            try {
430                return new FileInputStream(f);
431            } catch (IOException ignored) {
432            }
433        }
434        return null;
435    }
436
437    /**
438     * This isn't what the RI does. The RI doesn't have hard-coded defaults, so supplying your
439     * own "content.types.user.table" means you don't get any of the built-ins, and the built-ins
440     * come from "$JAVA_HOME/lib/content-types.properties".
441     */
442    private static void applyOverrides() {
443        // Get the appropriate InputStream to read overrides from, if any.
444        InputStream stream = getContentTypesPropertiesStream();
445        if (stream == null) {
446            return;
447        }
448        try {
449            try {
450                // Read the properties file...
451                Properties overrides = new Properties();
452                overrides.load(stream);
453                // And translate its mapping to ours...
454                for (Map.Entry<Object, Object> entry : overrides.entrySet()) {
455                    String extension = (String) entry.getKey();
456                    String mimeType = (String) entry.getValue();
457                    add(mimeType, extension);
458                }
459            } finally {
460                stream.close();
461            }
462        } catch (IOException ignored) {
463        }
464    }
465
    // Not instantiable: the class only exposes static members.
    private MimeUtils() {
    }
468
469    /**
470     * Returns true if the given MIME type has an entry in the map.
471     *
472     * @param mimeType A MIME type (i.e. text/plain)
473     * @return True iff there is a mimeType entry in the map.
474     */
475    public static boolean hasMimeType(String mimeType) {
476        if (mimeType == null || mimeType.isEmpty()) {
477            return false;
478        }
479        return mimeTypeToExtensionMap.containsKey(mimeType);
480    }
481
482    /**
483     * Returns the MIME type for the given extension.
484     *
485     * @param extension A file extension without the leading '.'
486     * @return The MIME type for the given extension or null iff there is none.
487     */
488    public static String guessMimeTypeFromExtension(String extension) {
489        if (extension == null || extension.isEmpty()) {
490            return null;
491        }
492        return extensionToMimeTypeMap.get(extension.toLowerCase());
493    }
494
495    /**
496     * Returns true if the given extension has a registered MIME type.
497     *
498     * @param extension A file extension without the leading '.'
499     * @return True iff there is an extension entry in the map.
500     */
501    public static boolean hasExtension(String extension) {
502        if (extension == null || extension.isEmpty()) {
503            return false;
504        }
505        return extensionToMimeTypeMap.containsKey(extension);
506    }
507
508    /**
509     * Returns the registered extension for the given MIME type. Note that some
510     * MIME types map to multiple extensions. This call will return the most
511     * common extension for the given MIME type.
512     *
513     * @param mimeType A MIME type (i.e. text/plain)
514     * @return The extension for the given MIME type or null iff there is none.
515     */
516    public static String guessExtensionFromMimeType(String mimeType) {
517        if (mimeType == null || mimeType.isEmpty()) {
518            return null;
519        }
520        return mimeTypeToExtensionMap.get(mimeType.split(";")[0]);
521    }
522
523    public static String guessMimeTypeFromUriAndMime(final Context context, final Uri uri, final String mime) {
524        Log.d(Config.LOGTAG, "guessMimeTypeFromUriAndMime " + uri + " and mime=" + mime);
525        if (mime == null || mime.equals("application/octet-stream")) {
526            final String guess = guessMimeTypeFromUri(context, uri);
527            if (guess != null) {
528                return guess;
529            } else {
530                return mime;
531            }
532        }
533        return guessMimeTypeFromUri(context, uri);
534    }
535
536    public static String guessMimeTypeFromUri(Context context, Uri uri) {
537        // try the content resolver
538        String mimeType;
539        try {
540            mimeType = context.getContentResolver().getType(uri);
541        } catch (Throwable throwable) {
542            mimeType = null;
543        }
544        // try the extension
545        if ((mimeType == null || mimeType.equals("application/octet-stream")) && uri.getPath() != null) {
546            String path = uri.getPath();
547            int start = path.lastIndexOf('.') + 1;
548            if (start < path.length()) {
549                final String guess = MimeUtils.guessMimeTypeFromExtension(path.substring(start));
550                if (guess != null) {
551                    mimeType = guess;
552                }
553            }
554        }
555        // sometimes this works (as with the commit content api)
556        if (mimeType == null) {
557            mimeType = uri.getQueryParameter("mimeType");
558        }
559        return mimeType;
560    }
561
562    public static String extractRelevantExtension(URL url) {
563        String path = url.getPath();
564        return extractRelevantExtension(path, true);
565    }
566
567    public static String extractRelevantExtension(final String path) {
568        return extractRelevantExtension(path, false);
569    }
570
571    public static String extractRelevantExtension(final String path, final boolean ignoreCryptoExtension) {
572        if (path == null || path.isEmpty()) {
573            return null;
574        }
575
576        String filename = path.substring(path.lastIndexOf('/') + 1).toLowerCase();
577        int dotPosition = filename.lastIndexOf(".");
578
579        if (dotPosition != -1) {
580            String extension = filename.substring(dotPosition + 1);
581            // we want the real file extension, not the crypto one
582            if (ignoreCryptoExtension && Transferable.VALID_CRYPTO_EXTENSIONS.contains(extension)) {
583                return extractRelevantExtension(filename.substring(0, dotPosition));
584            } else {
585                return extension;
586            }
587        }
588        return null;
589    }
590}