| Classes in this File | Line Coverage | Branch Coverage | Complexity | ||||
| WhiteSpacesPurifier |
|
| 5.5;5.5 |
| 1 | /* | |
| 2 | * Licensed to the Apache Software Foundation (ASF) under one or more | |
| 3 | * contributor license agreements. See the NOTICE file distributed with | |
| 4 | * this work for additional information regarding copyright ownership. | |
| 5 | * The ASF licenses this file to You under the Apache License, Version 2.0 | |
| 6 | * (the "License"); you may not use this file except in compliance with | |
| 7 | * the License. You may obtain a copy of the License at | |
| 8 | * | |
| 9 | * http://www.apache.org/licenses/LICENSE-2.0 | |
| 10 | * | |
| 11 | * Unless required by applicable law or agreed to in writing, software | |
| 12 | * distributed under the License is distributed on an "AS IS" BASIS, | |
| 13 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
| 14 | * See the License for the specific language governing permissions and | |
| 15 | * limitations under the License. | |
| 16 | */ | |
| 17 | ||
| 18 | package org.apache.any23.mime.purifier; | |
| 19 | ||
| 20 | import java.io.IOException; | |
| 21 | import java.io.InputStream; | |
| 22 | ||
| 23 | /** | |
| 24 | * Implementation of {@link Purifier} that removes all the eventual blank | |
| 25 | * characters at the header of a file that might prevents its <i>MIME Type</i> detection. | |
| 26 | * | |
| 27 | * @author Davide Palmisano ( dpalmisano@gmail.com ) | |
| 28 | */ | |
| 29 | 0 | public class WhiteSpacesPurifier implements Purifier { |
| 30 | ||
| 31 | /** | |
| 32 | * {@inheritDoc} | |
| 33 | */ | |
| 34 | public void purify(InputStream inputStream) throws IOException { | |
| 35 | 0 | if(!inputStream.markSupported()) |
| 36 | 0 | throw new IllegalArgumentException("Provided InputStream does not support marks"); |
| 37 | ||
| 38 | // mark the current position | |
| 39 | 0 | inputStream.mark(Integer.MAX_VALUE); |
| 40 | 0 | int byteRead = inputStream.read(); |
| 41 | 0 | char charRead = (char) byteRead; |
| 42 | 0 | while(isBlank(charRead) && (byteRead != -1)) { |
| 43 | // if here means that the previos character must be removed, so mark. | |
| 44 | 0 | inputStream.mark(Integer.MAX_VALUE); |
| 45 | 0 | byteRead = inputStream.read(); |
| 46 | 0 | charRead = (char) byteRead; |
| 47 | } | |
| 48 | // if exit go back to the last valid mark. | |
| 49 | 0 | inputStream.reset(); |
| 50 | 0 | } |
| 51 | ||
| 52 | private boolean isBlank(char c) { | |
| 53 | 0 | return c == '\t' || c == '\n' || c == ' ' || c == '\r' || c == '\b' || c == '\f'; |
| 54 | } | |
| 55 | } |