Project

General

Profile

Download (4.17 KB) Statistics
| Branch: | Tag: | Revision:
1
/**
* Copyright (C) 2007 EDIT
* European Distributed Institute of Taxonomy
* http://www.e-taxonomy.eu
*
* The contents of this file are subject to the Mozilla Public License Version 1.1
* See LICENSE.TXT at the top of this package for the full license terms.
*/
9
package eu.etaxonomy.cdm.io.dwca.in;
10

    
11
import java.util.ArrayList;
12
import java.util.List;
13
import java.util.Map;
14
import java.util.Set;
15

    
16
import org.apache.log4j.Logger;
17

    
18
import eu.etaxonomy.cdm.io.dwca.TermUri;
19
import eu.etaxonomy.cdm.io.stream.StreamImportBase;
20
import eu.etaxonomy.cdm.io.stream.StreamImportConfiguratorBase;
21
import eu.etaxonomy.cdm.io.stream.StreamImportStateBase;
22
import eu.etaxonomy.cdm.model.common.CdmBase;
23
import eu.etaxonomy.cdm.model.common.IdentifiableEntity;
24
import eu.etaxonomy.cdm.model.reference.Reference;
25

    
26

    
27
/**
28
 * @author a.mueller
29
 *
30
 */
31
public class StreamPartitioner<ITEM extends IConverterInput>  implements INamespaceReader<IReader<MappedCdmBase>>{
32
	private static final Logger logger = Logger.getLogger(StreamPartitioner.class);
33
	
34
	private int partitionSize;
35
	private LookAheadStream<ITEM> inStream;
36
	private IPartitionableConverter converter;
37
	private StreamImportStateBase<StreamImportConfiguratorBase, StreamImportBase> state;
38
	private ConcatenatingReader<MappedCdmBase> outStream;
39
	
40
	public StreamPartitioner(INamespaceReader<ITEM> input, IPartitionableConverter converter, StreamImportStateBase state, Integer size){
41
		 this.inStream = new LookAheadStream<ITEM>(input);
42
		 this.converter = converter;
43
		 this.partitionSize = size;
44
		 this.state = state;
45
		 initNewOutStream();
46
	}
47
	
48

    
49
	private void initNewOutStream(){
50
		outStream = new ConcatenatingReader<MappedCdmBase>();
51
	}
52
	
53
	/* (non-Javadoc)
54
	 * @see eu.etaxonomy.cdm.io.dwca.in.IReader#hasNext()
55
	 */
56
	public boolean hasNext() {
57
		if (this.outStream.hasNext()){
58
			return true;
59
		}else{
60
			return inStream.hasNext();  //TODO what, if converter returns no ouput for inStream.hasNext() ??
61
			//but be aware that requesting the next object from the next partition crosses the transactional borders 
62
		}
63
	}
64
	
65
	@Override
66
	public IReader<MappedCdmBase> read() {
67
		logger.debug("Start partitioner read");
68
		handleNextPartition();
69
		IReader<MappedCdmBase> result = this.outStream;
70
		
71
		initNewOutStream();
72
		logger.debug("End partitioner read");
73
		return result;
74
	}
75
	
76
	private void handleNextPartition(){
77

    
78
		List<ITEM> lookaheadArray = new ArrayList<ITEM>();
79
		while (this.inStream.hasNextLookAhead(partitionSize)){
80
			lookaheadArray.add(this.inStream.readLookAhead());
81
		}
82
		
83
		IReader<ITEM> lookaheadStream = new ListReader<ITEM>(lookaheadArray);
84
		
85
		Map<String, Set<String>> foreignKeys = converter.getPartitionForeignKeys(lookaheadStream);
86
		IImportMapping mapping = state.getMapping();
87
		InMemoryMapping partialMapping = mapping.getPartialMapping(foreignKeys);
88
		Reference<?> sourceRef = state.getCurrentIO().getReferenceService().find(state.getConfig().getSourceRefUuid());
89
		partialMapping.putMapping(TermUri.CDM_SOURCE_REFERENCE.toString(), state.getConfig().getSourceRefUuid().toString(), sourceRef);
90
		
91
		state.loadRelatedObjects(partialMapping);
92
				
93
		while (inStream.isLookingAhead() && inStream.hasNext()){
94
			IReader<MappedCdmBase> resultReader = converter.map(inStream.read());
95
			List<MappedCdmBase> resultList = new ArrayList<MappedCdmBase>();  //maybe better let converter return list from the beginning
96
			while (resultReader.hasNext()){
97
				MappedCdmBase item = resultReader.read();
98
				resultList.add(item);
99
				addItemToRelatedObjects(item);
100
			}
101
			outStream.add(new ListReader<MappedCdmBase>(resultList));
102
		}
103
			
104
		return;
105

    
106
	}
107

    
108
	
109
	/**
110
	 * Add new items to the local mapping
111
	 * @param item
112
	 */
113
	private void addItemToRelatedObjects(MappedCdmBase<IdentifiableEntity> item) {
114
		CdmBase cdmBase = item.getCdmBase();
115
		if (cdmBase.getId() == 0){
116
			if (cdmBase.isInstanceOf(IdentifiableEntity.class)){
117
				if (converter.requiredSourceNamespaces().contains(item.getNamespace())){
118
					state.addRelatedObject(item.getNamespace(), item.getSourceId(),  item.getCdmBase());
119
				}
120
			}
121
		}
122
	}
123

    
124

    
125
	@Override
126
	public TermUri getTerm() {
127
		return inStream.getTerm();
128
	}
129
	
130

    
131
}
(35-35/35)