-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathCutBytes.java
executable file
·378 lines (342 loc) · 12.2 KB
/
CutBytes.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
package bytearray_cut_bytes;
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.FileOutputStream;
import java.io.FilterInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.net.HttpURLConnection;
import java.net.URL;
import java.net.URLConnection;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.Comparator;
/**
 * Copies a byte stream while cutting out every region that starts with one of the
 * "begin" markers and ends with one of the "end" markers (both markers are removed too).
 *
 * <p>Matching rules used by the filtering copy:
 * <ul>
 *   <li>the input is scanned left to right and the earliest marker occurrence wins;</li>
 *   <li>when several markers match at the same position the longest one wins;</li>
 *   <li>the result does not depend on how the input stream splits the data into reads;</li>
 *   <li>a region that is opened but never closed is dropped up to the end of the input.</li>
 * </ul>
 */
public class CutBytes {
    /** Number of bytes requested from the input stream per read, on top of the marker look-ahead. */
    private static final int CHUNK_SIZE = 4096;

    /**
     * Reads {@code file:///d:/temp.html} and returns its content without the blocks that start
     * with {@code <script} and end with {@code </script>} or {@code />}.
     *
     * @return the filtered content of the document
     * @throws IOException if the document cannot be opened or read
     */
    public byte[] getBytes() throws IOException {
        URLConnection connection = new URL("file:///d:/temp.html").openConnection();
        connection.setDoInput(true);
        connection.connect();

        ArrayList<String> removeBegin = new ArrayList<String>();
        removeBegin.add("<script");
        ArrayList<String> removeEnd = new ArrayList<String>();
        removeEnd.add("</script>");
        removeEnd.add("/>");

        ByteArrayOutputStream output = new ByteArrayOutputStream();
        InputStream inputStream = connection.getInputStream();
        try {
            this.copyFromInputToOutput(inputStream, output, removeBegin, removeEnd);
        } finally {
            // the stream was never closed before, which leaked the underlying file handle
            inputStream.close();
        }
        return output.toByteArray();
    }

    /**
     * Copies everything from the source to the destination without any filtering.
     *
     * @param inputStream  data source
     * @param outputStream data destination
     * @throws IOException if reading or writing fails
     */
    private void copyFromInputToOutput(InputStream inputStream, OutputStream outputStream) throws IOException {
        byte[] buffer = new byte[400];
        int byteCount;
        while ((byteCount = inputStream.read(buffer)) != -1) {
            outputStream.write(buffer, 0, byteCount);
        }
    }

    /**
     * Converts the marker strings to byte arrays ordered from the longest to the shortest.
     *
     * <p>The list passed in is left untouched (it used to be sorted in place). {@code null}
     * and empty entries are skipped because they cannot be searched for. The strings are
     * encoded with the platform default charset, as before.
     *
     * @param list marker strings, may be {@code null}
     * @return marker bytes, longest first; markers of equal length keep their relative order
     */
    private ArrayList<byte[]> getSortByLengthList(ArrayList<String> list) {
        ArrayList<byte[]> returnValue = new ArrayList<byte[]>();
        if (list != null) {
            for (String marker : list) {
                if (marker == null) {
                    continue;
                }
                byte[] bytes = marker.getBytes();
                if (bytes.length > 0) {
                    returnValue.add(bytes);
                }
            }
        }
        // order by encoded length, because that is what the scanner compares
        Collections.sort(returnValue, new Comparator<byte[]>() {
            @Override
            public int compare(byte[] o1, byte[] o2) {
                if (o1.length == o2.length) {
                    return 0;
                }
                return o1.length > o2.length ? -1 : 1;
            }
        });
        return returnValue;
    }

    /**
     * Copies data from the source to the destination, leaving out every block that starts with
     * one of the begin markers and ends with one of the end markers.
     *
     * @param inputStream  data source
     * @param outputStream data destination
     * @param removeBegin  strings that signal the start of a block that must not be copied
     * @param removeEnd    strings that signal the end of a block that must not be copied
     * @throws IOException if reading or writing fails
     */
    private void copyFromInputToOutput(InputStream inputStream,
                                       OutputStream outputStream,
                                       ArrayList<String> removeBegin,
                                       ArrayList<String> removeEnd) throws IOException {
        ArrayList<byte[]> beginBytes = this.getSortByLengthList(removeBegin);
        ArrayList<byte[]> endBytes = this.getSortByLengthList(removeEnd);
        // at least 1 so that "no markers at all" degrades to a plain copy
        int longestMarker = Math.max(1, Math.max(this.longestLength(beginBytes), this.longestLength(endBytes)));

        // sliding window: undecided tail of the previous read followed by fresh data
        byte[] window = new byte[CHUNK_SIZE + longestMarker];
        int filled = 0;
        /** flag: true while data is being copied, false while inside a removed block */
        boolean flagWrite = true;
        boolean endOfInput = false;

        while (!endOfInput) {
            // the kept tail is always shorter than longestMarker, so there is room for a real read
            int readCount = inputStream.read(window, filled, window.length - filled);
            if (readCount < 0) {
                endOfInput = true;
            } else {
                filled += readCount;
            }

            // Positions below this bound have enough bytes after them to compare even the
            // longest marker; the rest must wait for more data unless the input is finished.
            int decidable = endOfInput ? filled : filled - longestMarker + 1;
            int position = 0;
            int keepFrom = 0; // start of the bytes scanned in write mode and not yet written

            while (position < decidable) {
                int markerLength = this.matchLengthAt(window, position, filled, flagWrite ? beginBytes : endBytes);
                if (markerLength == 0) {
                    position++;
                    continue;
                }
                if (flagWrite) {
                    // write everything that precedes the begin marker
                    outputStream.write(window, keepFrom, position - keepFrom);
                }
                // skip the marker itself and switch between copying and removing
                position += markerLength;
                keepFrom = position;
                flagWrite = !flagWrite;
            }
            if (flagWrite && position > keepFrom) {
                outputStream.write(window, keepFrom, position - keepFrom);
            }

            // move the undecided tail to the front of the window
            filled -= position;
            System.arraycopy(window, position, window, 0, filled);
        }
        outputStream.flush();
    }

    /**
     * Returns the length of the first marker (longest first) that occurs at the given position.
     *
     * @param data     window with the data
     * @param position index at which a marker has to start
     * @param limit    number of valid bytes in {@code data}; bytes beyond it are never inspected
     * @param markers  markers ordered from the longest to the shortest
     * @return length of the matching marker, or 0 when none of them starts at {@code position}
     */
    private int matchLengthAt(byte[] data, int position, int limit, ArrayList<byte[]> markers) {
        for (byte[] marker : markers) {
            if (position + marker.length > limit) {
                continue;
            }
            int index = 0;
            while (index < marker.length && data[position + index] == marker[index]) {
                index++;
            }
            if (index == marker.length) {
                return marker.length;
            }
        }
        return 0;
    }

    /**
     * Returns the length of the longest marker of a list produced by {@link #getSortByLengthList}.
     *
     * @param markers markers ordered from the longest to the shortest
     * @return length of the first marker, or 0 for an empty list
     */
    private int longestLength(ArrayList<byte[]> markers) {
        return markers.isEmpty() ? 0 : markers.get(0).length;
    }

    /**
     * Filters {@code d:/temp.html} and stores the result in {@code d:\test.html}.
     * Any failure is reported on standard error.
     *
     * @param args not used
     */
    public static void main(String[] args) {
        try {
            CutBytes cutBytes = new CutBytes();
            FileOutputStream output = new FileOutputStream(new File("d:\\test.html"));
            try {
                output.write(cutBytes.getBytes());
            } finally {
                // the stream was never closed before
                output.close();
            }
        } catch (Exception ex) {
            System.err.println("Exception:" + ex.getMessage());
        }
    }

    /**
     * Debug helper: renders the bytes as decimal numbers, each followed by a space.
     *
     * @param bs bytes to render
     * @return textual representation of the bytes
     */
    private static String getStringFromArrayListOfByte(byte[] bs) {
        StringBuilder returnValue = new StringBuilder();
        for (int index = 0; index < bs.length; index++) {
            returnValue.append(bs[index]);
            returnValue.append(" ");
        }
        return returnValue.toString();
    }
}
/**
 * Mutable holder for a boolean flag together with an integer size, so that a method
 * can hand both values back to its caller through a parameter.
 */
class BooleanWrap {
    /** Current flag value. */
    private boolean value;
    /** Current size value; stays 0 until {@link #setSize(int)} is called. */
    private int length;

    /**
     * Creates a holder with the given flag and a size of 0.
     *
     * @param flag initial flag value
     */
    public BooleanWrap(boolean flag) {
        value = flag;
        length = 0;
    }

    /**
     * Stores a new flag value.
     *
     * @param flag value to store
     */
    public void setValue(boolean flag) {
        value = flag;
    }

    /** @return the stored flag value */
    public boolean getValue() {
        return value;
    }

    /**
     * Stores a new size value.
     *
     * @param size value to store
     */
    public void setSize(int size) {
        length = size;
    }

    /** @return the stored size value */
    public int getSize() {
        return length;
    }
}
/**
 * Result of a byte search: identifies which array of a list was found
 * (its index) and the position at which it starts.
 */
class FindElementPosition {
    /** Index of the found array inside the list that was searched for. */
    private final int elementIndex;
    /** Position at which the found array starts. */
    private final int start;

    /**
     * @param indexOfElement index of the found array in the list of searched arrays
     * @param startPosition  position at which the found array starts
     */
    public FindElementPosition(int indexOfElement, int startPosition) {
        elementIndex = indexOfElement;
        start = startPosition;
    }

    /** @return position at which the found array starts */
    int getStartPosition() {
        return start;
    }

    /** @return index of the found array in the list of searched arrays */
    int getIndexOfElement() {
        return elementIndex;
    }
}
/**
 * Checked exception signalling that more data has to be read;
 * it carries the amount of data requested by the thrower.
 */
class NeedDataException extends Exception {
    private static final long serialVersionUID = 1L;

    /** Amount of data that has to be read. */
    private final int requestedCount;

    /**
     * @param needDataForRead amount of data that has to be read
     */
    public NeedDataException(int needDataForRead) {
        super();
        requestedCount = needDataForRead;
    }

    /** @return the amount of data that has to be read */
    public int getNeedDataForRead() {
        return requestedCount;
    }
}