001package Torello.HTML.Tools.Images; 002 003import java.util.regex.*; 004import java.io.*; 005 006import java.awt.image.BufferedImage; 007import javax.imageio.ImageIO; 008import java.util.Base64; 009import java.net.URL; 010 011import Torello.Java.Additional.Ret2; 012 013/** 014 * An enumeration of the primary image-types available on the internet. 015 * 016 * <BR /><BR />This is just an enumerated-type used to ensure proper parameter-requests when 017 * downloading images. The type provides a simple means for storing words such as <code>'jpg,' 018 * 'png,' 'gif,' etc...</code> when attempting to download images. 019 * 020 * @see ImageScrape 021 * @see ImageScraper 022 */ 023public enum IF 024{ 025 // ******************************************************************************************** 026 // ******************************************************************************************** 027 // The Constants 028 // ******************************************************************************************** 029 // ******************************************************************************************** 030 031 032 /** 033 * Used to indicate a picture using the common {@code '.jpg'} image format. 034 * According to a <B>Yahoo! Search</B> link: 035 * 036 * <BR /><BR /><CODE> The JPEG file extension is used interchangeably 037 * with JPG. JPEG stands for Joint Photographic Experts Group who created the standard. 038 * JPG files have 2 sub-formats, JPG/ Exif (often used in digital cameras and photographic 039 * equipment), and JPG/ JFIF (often used on the World Wide Web).</CODE> 040 * 041 * <BR /><BR />What is JPG? What Opens a JPG? Exact Link: 042 * 043 * <BR /><BR /><A HREF="http://whatis.techtarget.com/fileformat/JPG-JPEG-bitmap" TARGET=_blank> 044 * http://whatis.techtarget.com/fileformat/JPG-JPEG-bitmap</A> 045 */ 046 JPG("jpg", "jpeg"), 047 048 /** 049 * Used to indicate a picture using the common ommon {@code '.gif'} image format. 050 * Short for <CODE><B>"Graphics Interchange Format".</B></CODE> 051 */ 052 GIF("gif"), 053 054 /** 055 * Used to indicate a picture using the common ommon {@code '.bmp'} image format. 056 * Abbreviation of the word <CODE><B>'Bit Map'</B></CODE> 057 */ 058 BMP("bmp"), 059 060 /** 061 * Used to indicate a picture using the common {@code '.png'} image format. 062 * <CODE><B>PNG</B></CODE> stands for <CODE><B>Portable Network Graphics.</B></CODE> 063 * It is an open source file extension for raster graphics files. 064 */ 065 PNG("png"); 066 067 068 // ******************************************************************************************** 069 // ******************************************************************************************** 070 // Fields 071 // ******************************************************************************************** 072 // ******************************************************************************************** 073 074 075 /** This is the actual file-name extension saved as a {@code String}. */ 076 public final String extension; 077 078 /** 079 * This field is always just null, except for the case of the {@code 'JPG'} Enumeration 080 * Constant. For that Image-Format this simply evaluates to the {@code String 'jpeg'}. 081 */ 082 public final String alternateExtension; 083 084 /** 085 * This will parse a {@code 'Base64' String} into two groups using Java's RegEx Tools. 086 * 087 * <BR /><DIV CLASS=EXAMPLE>{@code 088 * import java.util.regex.Matcher; 089 * ... 090 * 091 * Matcher m = IF.B64_INIT_STRING.matcher(base64String); 092 * if (m.find()) 093 * { ... } 094 * }</DIV> 095 * 096 * <BR /><BR /><OL CLASS=JDOL> 097 * <LI> {@code m.group(1) => } Image Encoding Type-{@code String} ({@code "gif", "jpg",} etc..) 098 * <BR /><BR /> 099 * </LI> 100 * <LI>{@code m.gropu(2) => } Base 64 Encoded Image-{@code String} 101 * <BR /> 102 * </LI> 103 * </OL> 104 */ 105 public static final Pattern B64_INIT_STRING = Pattern.compile( 106 "^\\s*data:\\s*image\\/\\s*([A-Za-z]{3,4})\\s*;\\s*base64\\s*,(.*)$", 107 Pattern.CASE_INSENSITIVE 108 ); 109 110 private static final IF[] arr = { JPG, GIF, BMP, PNG }; 111 112 113 // ******************************************************************************************** 114 // ******************************************************************************************** 115 // Constructors 116 // ******************************************************************************************** 117 // ******************************************************************************************** 118 119 120 // Used for GIF, BMP & PNG 121 private IF(String extension) 122 { 123 this.extension = extension; 124 this.alternateExtension = null; 125 } 126 127 // Used for JPG 128 private IF(String extension, String alternateExtension) 129 { 130 this.extension = extension; 131 this.alternateExtension = alternateExtension; 132 } 133 134 135 // ******************************************************************************************** 136 // ******************************************************************************************** 137 // "Guess the Extension" Methods 138 // ******************************************************************************************** 139 // ******************************************************************************************** 140 141 142 /** 143 * This will extract the file-extension from an image {@code URL}. Not all images on the 144 * internet have {@code URL's} that end with the actual image-file-type. In that case, or in 145 * the case that the {@code 'uriStr'} is a pointer to a non-image-file, {@code 'null'} will 146 * be returned. 147 * 148 * @param uriStr Is the {@code uri} or File-Name of an image. 149 * 150 * @return If extension has a file-extension that is listed in the {@code IF[]} Array - that 151 * file-extension will be returned, otherwise {@code 'null'} will be returned. 152 */ 153 public static IF getGuess(String uriStr) 154 { 155 if (uriStr == null) return null; 156 157 int pos = uriStr.lastIndexOf("."); 158 159 if (pos == -1) return null; 160 if (pos == uriStr.length() - 1) return null; 161 162 String s = uriStr.substring(pos + 1).toLowerCase().trim(); 163 164 // The following array is a private & static array defined above 165 // NOTE: private static final IF[] arr = { JPG, GIF, BMP, PNG }; 166 167 for (int i=0; i < arr.length; i++) 168 169 if (arr[i].extension.equals(s)) return arr[i]; 170 171 else if ( (arr[i].alternateExtension != null) 172 && (arr[i].alternateExtension.equals(s))) 173 174 return arr[i]; 175 176 return null; 177 } 178 179 /** 180 * Invokes {@link #getGuess(String)}, and returns the results - <I>unless the returned result 181 * would be null, in which case a {@link UnrecognizedImageExtException} is thrown instead</I>. 182 * 183 * @param uriStr Is the {@code uri} or File-Name of the image. 184 * 185 * @return The Image-Format of this Image, based on it's File-Name 186 * 187 * @throws UnrecognizedImageExtException If the Image-Type cannot be determined (does not match 188 * any) based on its File-Name Extension. ({@code '.jpg', '.png', '.gif'} etc...) 189 */ 190 public static IF guessOrThrow(String uriStr) 191 { 192 IF ret = getGuess(uriStr); 193 if (ret != null) return ret; 194 195 throw new UnrecognizedImageExtException( 196 "The URI or File-Name\n" + 197 "[" + uriStr + "]\n" + 198 "doesn't have a File-Extension that matches any of the recognized Image-Types " + 199 "('.jpg', '.png', '.gif' etc...)" 200 ); 201 } 202 203 /** 204 * Converts a {@code String} image-extension to an instance this enumerated type. 205 * @param extension A valid image-format extension 206 * @return An instance of this enumeration, if applicable, or {@code 'null'} otherwise. 207 */ 208 public static IF get(String extension) 209 { 210 extension = extension.toLowerCase().trim(); 211 212 // The following array is a private & static array defined above 213 // NOTE: private static final IF[] arr = { JPG, GIF, BMP, PNG }; 214 215 for (int i=0; i < arr.length; i++) 216 217 if (arr[i].extension.equals(extension)) return arr[i]; 218 219 else if ( (arr[i].alternateExtension != null) 220 && (arr[i].alternateExtension.equals(extension))) 221 222 return arr[i]; 223 224 return null; 225 } 226 227 /** 228 * This will retrieve the image name from a {@code java.net.URL} object. 229 * 230 * @param url The {@code url} of the image. 231 * 232 * @return If this {@code URL} has a file-extension that is listed in the {@code IF[]} Array, 233 * that file-extension will be returned, otherwise {@code 'null'} will be returned. 234 */ 235 public static IF getGuess(URL url) 236 { 237 String f = url.getFile(); 238 239 return (f != null) ? getGuess(f) : null; 240 } 241 242 243 // ******************************************************************************************** 244 // ******************************************************************************************** 245 // Decode Base-64 String Methods 246 // ******************************************************************************************** 247 // ******************************************************************************************** 248 249 250 /** 251 * This will retrieve a Buffered Image from a {@code String} retrieved from a string that 252 * follows this format below. This is the format usually found inside HTML Image Tags. 253 * 254 * <BR /><BR /><B>SPECIFICALLY: </B><SPAN STYLE="color: green;"> 255 * {@code <IMG SRC="data:image/{png or gif or jpg etc};base64,...">}</SPAN> 256 * 257 * <BR /><BR />The ellipsis (...) above represents the actual {@code Base-64} encoded 258 * {@code String}. Many web-sites return HTML image tags with the actual picture/image encoded 259 * into a {@code String} and saved inside the {@code 'SRC'} attribute. This method will decode 260 * that image-as-a-{@code String} into a {@code java.awt.image.BufferedImage} 261 * 262 * @param base64EncodedImageWithFormat The best way to obtain this {@code String} is to use the 263 * command [{@code String encoded = imageTag.AV("src"); }], and pass this variable 264 * {@code 'encoded'} to this parameter. It is important to note that variable 265 * {@code 'imageTag'} must be a {@code public class TagNode}, and that {@code TagNode} must: 266 * 267 * <BR /><BR /><UL CLASS=JDUL> 268 * <LI> Have {@code public final String tok} equal to {@code 'img'} 269 * <BR /><BR /> 270 * </LI> 271 * 272 * <LI> The {@code <IMG>} represented must have a {@code SRC="..."} which contains a 273 * {@code Base-64} encoded image. 274 * </LI> 275 * </UL> 276 * 277 * @return A decoded image that can be saved to file, and an instance of {@code IF} that 278 * identifies what type of image was specified. 279 * 280 * <BR /><BR /><UL CLASS=JDUL> 281 * <LI> {@code Ret2.a} (BufferedImage):} The Converted Image 282 * <BR /><BR /> 283 * </LI> 284 * 285 * <LI> {@code Ret2.b} (IF):} The Image Type 286 * </LI> 287 * </UL> 288 */ 289 public static Ret2<BufferedImage, IF> 290 decodeBase64ToImage(String base64EncodedImageWithFormat) 291 { 292 // sourceData = '...=='; 293 Matcher m = B64_INIT_STRING.matcher(base64EncodedImageWithFormat); 294 295 if (! m.find()) return null; 296 297 String imageFormatStr = m.group(1); 298 String base64EncodedImage = m.group(2); 299 300 IF imageFormat = (imageFormatStr != null) ? IF.get(imageFormatStr) : null; 301 302 if (imageFormat == null) return null; 303 304 BufferedImage bi = decodeBase64ToImage(base64EncodedImage, imageFormat); 305 306 if (bi == null) return null; 307 308 return new Ret2<BufferedImage, IF>(bi, imageFormat); 309 } 310 311 /** 312 * This will decode a {@code Base-64 String} into an image. Here, the decoder used is the one 313 * obtained from a call to: {@code java.util.Base64.getDecoder() }. 314 * 315 * <BR /><BR /><SPAN CLASS=CopiedJDK>Text copied from class: 316 * {@code java.util.Base64}, <B>JDK 1.8</B></SPAN> 317 * 318 * <BR /><BR /><B>Basic: </B> Uses "The Base64 Alphabet" as specified in <I><B>Table 1 of RFC 319 * 4648 and RFC 2045</B></I> for encoding and decoding operation. The encoder does not add any 320 * line feed (line separator) character. The decoder rejects data that contains characters 321 * outside the base64 alphabet. 322 * 323 * @return A decoded image that can be saved to file. 324 */ 325 public static BufferedImage decodeBase64ToImage(String base64EncodedImage, IF imageFormat) 326 { 327 try 328 (ByteArrayInputStream bis = new ByteArrayInputStream 329 (Base64.getDecoder().decode(base64EncodedImage))) 330 331 { return ImageIO.read(bis); } 332 333 catch (IOException e) { return null; } 334 } 335 336 /** 337 * This will decode a base-64 String into an image. Here, the decoder used is the one obtained 338 * from a call to: {@code java.util.Base64.getURLDecoder() }. 339 * 340 * <BR /><BR /><SPAN CLASS=CopiedJDK>Text copied from class: 341 * {@code java.util.Base64}, <B>JDK 1.8</B></SPAN> 342 * 343 * <BR /><BR /><B>URL and Filename safe: </B> Uses the "URL and Filename safe Base64 Alphabet" 344 * as specified in <B><I>Table 2 of RFC 4648</B></I> for encoding and decoding. The encoder 345 * does not add any line feed (line separator) character. The decoder rejects data that 346 * contains characters outside the base64 alphabet. 347 * 348 * @return A decoded image that can be saved to file. 349 */ 350 public static BufferedImage decodeBase64ToImage_V2(String base64EncodedImage, IF imageFormat) 351 { 352 try 353 (ByteArrayInputStream bis = new ByteArrayInputStream 354 (Base64.getUrlDecoder().decode(base64EncodedImage))) 355 356 { return ImageIO.read(bis); } 357 358 catch (IOException e) { return null; } 359 } 360 361 362 // ******************************************************************************************** 363 // ******************************************************************************************** 364 // java.lang.Object 365 // ******************************************************************************************** 366 // ******************************************************************************************** 367 368 369 /** 370 * Convert an instance of this enumerated-type to a {@code String}. 371 * @return The image-format extension as a {@code String}. 372 */ 373 public String toString() { return extension; } 374}