Project

General

Profile

Download (9.94 KB) Statistics
| Branch: | Tag: | Revision:
1
<?php
2

    
3
/**
4
 * @file
5
 * Functions for handling CDM TaggedText arrays
6
 *
7
 *
8
 * @copyright
9
 *   (C) 2007-2018 EDIT
10
 *   European Distributed Institute of Taxonomy
11
 *   http://www.e-taxonomy.eu
12
 *
13
 *   The contents of this module are subject to the Mozilla
14
 *   Public License Version 1.1.
15
 * @see http://www.mozilla.org/MPL/MPL-1.1.html
16
 *
17
 * @author
18
 *   - Andreas Kohlbecker <a.kohlbecker@BGBM.org>
19
 */
20

    
21
/**
 * Creates a new tagged text object.
 *
 * @param string $tag_type
 *   The value stored in the 'type' property of the new object.
 * @param string $text
 *   The value stored in the 'text' property of the new object, NULL by default.
 *
 * @return object
 *   A stdClass instance with the properties 'type' and 'text' (in this order).
 */
function tagged_text_new($tag_type, $text = null){
  // Casting an array yields a stdClass whose properties follow the key order.
  return (object) array(
    'type' => $tag_type,
    'text' => $text,
  );
}
27

    
28
/**
 * Expands the entity references contained in a TaggedText array.
 *
 * Every element which has a TaggedText->entityReference and whose type is not
 * listed in $skiptags is looked up through cdm_ws_get(). When that call returns
 * a non-empty result, the result is spliced into the output in place of the
 * original element. All other elements are copied over unchanged.
 *
 * @param array $taggedtxt
 *    The original TaggedText array
 * @param array $skiptags
 *    Optional list of tag names to skip
 * @return array
 *    The new tagged text with all TaggedText->entityReference objects expanded
 */
function cdm_tagged_text_expand_entity_references(array $taggedtxt, $skiptags = array()) {
  $result = array();
  foreach ($taggedtxt as $item) {
    $replacement = null;
    if (isset($item->entityReference) && !in_array($item->type, $skiptags)) {
      $ws_base = cdm_ws_base_uri($item->entityReference->type);
      if ($ws_base) {
        // The name web service uses another method name than all the others.
        $method = $ws_base == CDM_WS_NAME ? "/taggedName" : "/taggedText";
        $replacement = cdm_ws_get($ws_base . "/" . $item->entityReference->uuid . $method);
      }
    }
    if ($replacement) {
      $result = array_merge($result, $replacement);
    }
    else {
      // default case: nothing to expand, or the lookup yielded nothing
      $result[] = $item;
    }
  }
  return $result;
}
63

    
64
/**
 * Converts an array of TaggedText items into corresponding html tags.
 *
 * Consecutive items of the same type share one wrapping element. Its class
 * attribute is set to the type of the TaggedText item, followed by the value of
 * html_class_attribute_ref() if the item has an entityReference. Items whose
 * type is listed in $skiptags or whose text is empty are ignored.
 *
 * Tagged text where the type starts with 'PLACEHOLDER_' is added to the markup
 * as plain text: the taggedText->type wrapped in curly brackets
 * ('{' . $tt->type . '}') is used instead of the text.
 * see tagged_text_extract_secref()
 *
 * The algorithm of this functions is basically the same as for
 * eu.etaxonomy.cdm.strategy.cache.TaggedCacheHelper.createString(List<TaggedText> tags, HTMLTagRules htmlRules)
 *
 * @param array $taggedtxt
 *   Array with text items to convert.
 * @param array $skiptags
 *   Array of tag names to skip
 * @param string $tag
 *   Name of the html element used to wrap the items, 'span' by default. Pass
 *   NULL (or any other empty value) to omit the wrapping elements completely.
 *
 * @return string
 *   The markup.
 */
function cdm_tagged_text_to_markup(array $taggedtxt, $skiptags = array(), $tag = 'span') {

  $out = '';
  $was_separator = false;
  $last_type = null;
  $i = 0;
  foreach ($taggedtxt as $tt) {
    if (!in_array($tt->type, $skiptags) && $tt->text) {
      if(isset($tt->entityReference)){
        $class_attr = $tt->type . " " . html_class_attribute_ref($tt->entityReference);
      } else {
        $class_attr = $tt->type;
      }
      $is_first = $i == 0;
      $is_separator = is_tagged_text_sepatator_type($tt->type);
      if(str_beginsWith($tt->type, 'PLACEHOLDER_')){
        // Placeholders never open or close an element and do not take part in
        // the type tracking, they are put into the output as they are.
        $out .=  '{'. $tt->type . '}';
      } else {
        // The type changed: close the element of the previous run of items ...
        if(($last_type && $last_type != $tt->type) && $tag) {
          $out .= '</' . $tag . '>';
        }
        // ... and open a new one for the current type.
        if((!$last_type || $last_type != $tt->type) && $tag){
          $out .= '<' . $tag . ' class="' . $class_attr . '">';
        }
        // Glue with a blank unless a separator is involved on either side.
        if(!$is_separator && !$was_separator && !$is_first){
          $out .= " ";
        }
        // NOTE(review): presumably Drupal's t(), where the '@' placeholder
        // escapes the text - confirm.
        $out .= t('@text', array('@text' => $tt->text));
        $was_separator = $is_separator;
        $last_type = $tt->type;
      }
    }
    $i++;
  }
  // $last_type is only set after an element has been opened for it, so the
  // element of the last run of items is still open here and must be closed,
  // otherwise the returned markup is unbalanced.
  if($last_type && $tag){
    $out .= '</' . $tag . '>';
  }
  return $out;
}
121

    
122
/**
 * Converts an array of TaggedText items into the corresponding text string
 * without wrapping html elements.
 *
 * This is a shortcut for cdm_tagged_text_to_markup() with the $tag parameter
 * set to NULL, so that no wrapping elements are created.
 *
 * The algorithm is basically the same as for
 * eu.etaxonomy.cdm.strategy.cache.TaggedCacheHelper.createString(List<TaggedText> tags)
 *
 * @param array $taggedtxt
 *   Array with text items to convert.
 * @param array $skiptags
 *   Array of tag names to skip
 *
 * @return string
 *   The plain text
 */
function cdm_tagged_text_to_string(array $taggedtxt, $skiptags = array()) {
  // An empty $tag suppresses all opening and closing elements.
  $wrapping_tag = null;
  $plain_text = cdm_tagged_text_to_markup($taggedtxt, $skiptags, $wrapping_tag);
  return $plain_text;
}
156

    
157
/**
 * Tells whether a tagged text type is one of the separator types, which are
 * 'separator' and 'postSeparator'.
 *
 * See cdmlib: boolean eu.etaxonomy.cdm.strategy.cache.TagEnum.isSeparator();
 *
 * @param string $tagged_text_type
 *   The type of a tagged text element.
 *
 * @return bool
 *   TRUE if the type is a separator type, FALSE otherwise.
 */
function is_tagged_text_sepatator_type($tagged_text_type){
  return in_array($tagged_text_type, array('separator', 'postSeparator'));
}
167

    
168

    
169
/**
 * Collects the texts of the taggedText instances having one of the given types.
 *
 * @param array $taggedtxt
 *   Array with text items.
 * @param array $include_tag_types
 *   Array of the tag types for which to find text items in the $taggedtxt array, or NULL
 *   to return all texts.
 *
 * @return array
 *   A numerically indexed array with the texts of the matching items, in the
 *   order in which they occur in $taggedtxt.
 */
function cdm_tagged_text_values(array $taggedtxt, $include_tag_types = NULL) {
  $texts = array();
  foreach ($taggedtxt as $item) {
    // With a type filter in place, leave out everything which is not listed.
    if ($include_tag_types !== NULL && !in_array($item->type, $include_tag_types)) {
      continue;
    }
    $texts[] = $item->text;
  }
  return $texts;
}
193

    
194
/**
 * Preprocess the taggedTitle arrays.
 *
 * Step 1: Elements of the type "hybridSign" are turned into elements of the
 * type "name". This modifies the passed objects themselves.
 *
 * Step 2: Two elements of the same type with an element of the type
 * "separator" between them are merged into one element: a clone of the first
 * one with the three texts concatenated.
 *
 * Anything which is not an array is left untouched.
 *
 * @param array $taggedTextList
 *    An array of TaggedText objects, replaced by the normalized array
 */
function normalize_tagged_text(&$taggedTextList) {

  if (!is_array($taggedTextList)) {
    return;
  }
  $total = count($taggedTextList);

  // First pass: rename.
  for ($pos = 0; $pos < $total; $pos++) {
    if ($taggedTextList[$pos]->type == "hybridSign") {
      $taggedTextList[$pos]->type = "name";
    }
  }

  // Second pass: resolve separators.
  $normalized = array();
  $pos = 0;
  while ($pos < $total) {
    $current = $taggedTextList[$pos];
    $is_mergeable = isset($taggedTextList[$pos + 2])
      && $taggedTextList[$pos + 1]->type == "separator"
      && $current->type == $taggedTextList[$pos + 2]->type;

    if ($is_mergeable) {
      // same type on both sides of the separator: all three become one element
      $merged = clone $current;
      $merged->text = $merged->text . $taggedTextList[$pos + 1]->text . $taggedTextList[$pos + 2]->text;
      $normalized[] = $merged;
      $pos += 3;
    }
    else {
      // no special handling
      $normalized[] = $current;
      $pos++;
    }
  }
  $taggedTextList = $normalized;
}
238

    
239
/**
 * Extracts the tagged text for sec references with separator and citation detail from a tagged text array.
 *
 * Only the first occurrence of a "separator" element directly followed by an
 * element of the type $ref_tag_type is extracted, together with an optional
 * second separator/reference pair (the microreference) directly behind it.
 * The extracted elements are removed from $tagged_text, which is re-indexed
 * afterwards. Anything which is not an array is left untouched.
 *
 * @param $tagged_text
 *    The tagged text to operate on
 * @param string $ref_tag_type
 *    The tagtype for a secreference is "secReference", but "relSecReference" is also used in case of relationships.
 * @param bool $replace_with_placeholder
 *    Whether to add a placeholder tagged text element as replacement for the extracted tagged text
 *    elements. The placeholder has the type and the text "PLACEHOLDER_" . $ref_tag_type.
 * @return array
 *    The extracted tagged text elements: separator and reference, optionally
 *    followed by the separator and reference of the microreference. Empty if
 *    nothing was found.
 */
function tagged_text_extract_secref(&$tagged_text, $ref_tag_type = "secReference", $replace_with_placeholder = false) {

  $extracted_tt = array();
  if (!is_array($tagged_text)) {
    // Nothing to search in. array_values() must not be reached with a
    // non-array value, as this is a TypeError in PHP 8.
    return $extracted_tt;
  }

  // The loop below relies on continuous numeric keys, which is not guaranteed
  // if elements have been unset from the array before.
  $tagged_text = array_values($tagged_text);

  $last_index = count($tagged_text) - 1;
  for ($i = 0; $i < $last_index; $i++) {
    if ($tagged_text[$i + 1]->type == $ref_tag_type && $tagged_text[$i]->type == "separator"){
      $extracted_tt[0] = $tagged_text[$i];
      $extracted_tt[1] = $tagged_text[$i + 1];

      if($replace_with_placeholder){
        // text must not be null, see cdm_tagged_text_to_markup()
        $tagged_text[$i] = tagged_text_new("PLACEHOLDER_" . $ref_tag_type, "PLACEHOLDER_" . $ref_tag_type);
      } else {
        unset($tagged_text[$i]);
      }
      unset($tagged_text[$i + 1]);
      // also get the microreference which could be in $tagged_text[$i + 3]
      if(isset($tagged_text[$i + 3])  && $tagged_text[$i + 2]->type == "separator" && $tagged_text[$i + 3]->type == $ref_tag_type){
        $extracted_tt[2] = $tagged_text[$i + 2];
        $extracted_tt[3] = $tagged_text[$i + 3];
        unset($tagged_text[$i + 2]);
        unset($tagged_text[$i + 3]);
      }
      break;
    }
  }
  $tagged_text = array_values($tagged_text); // re-index array to make it continuous again
  return $extracted_tt;
}
281

    
282
/**
 * Extracts the first element of the type "nomStatus" from a tagged text array.
 *
 * A "separator" element directly in front of the "nomStatus" element and a
 * "postSeparator" element directly behind it are extracted as well. All
 * extracted elements are removed from $tagged_text, which is re-indexed so
 * that its keys are continuous again. Anything which is not an array is left
 * untouched.
 *
 * @param $tagged_text
 *    The tagged text to operate on
 * @return array
 *    The extracted elements in their original order: the optional separator,
 *    the nomStatus element and the optional postSeparator. Empty if there is
 *    no element of the type "nomStatus".
 */
function tagged_text_extract_nomstatus(&$tagged_text) {

  $extracted_tt = array();
  if (!is_array($tagged_text)) {
    return $extracted_tt;
  }

  // The neighbour lookups below rely on continuous numeric keys.
  $tagged_text = array_values($tagged_text);

  // All elements are inspected, the nomStatus may well be the last one.
  $count = count($tagged_text);
  for ($i = 0; $i < $count; $i++) {
    if ($tagged_text[$i]->type != "nomStatus") {
      continue;
    }
    $extracted_tt[] = $tagged_text[$i];
    if (isset($tagged_text[$i + 1]) && $tagged_text[$i + 1]->type == "postSeparator") {
      $extracted_tt[] = $tagged_text[$i + 1];
      unset($tagged_text[$i + 1]);
    }
    // There is no preceding element if the nomStatus comes first.
    if (isset($tagged_text[$i - 1]) && $tagged_text[$i - 1]->type == "separator") {
      array_unshift($extracted_tt, $tagged_text[$i - 1]);
      unset($tagged_text[$i - 1]);
    }
    unset($tagged_text[$i]);
    break;
  }

  // re-index array to make it continuous again, the index based loops of the
  // other tagged text functions depend on this
  $tagged_text = array_values($tagged_text);
  return $extracted_tt;
}
304

    
305
/**
 * Finds all elements of the given type in an array of tagged text elements.
 *
 * @param array $taggedTextList
 *    An array of TaggedText objects. Anything which is not an array yields an
 *    empty result.
 * @param string $type
 *    The tagged text type to search for
 * @return array
 *    A numerically indexed array of the matching elements, in the order in
 *    which they occur in $taggedTextList.
 */
function find_tagged_text_elements($taggedTextList, $type){
  $matching_elements = array();
  if (is_array($taggedTextList)) {
    // foreach visits every element including the last one and does not depend
    // on continuous numeric keys.
    foreach ($taggedTextList as $tagged_text) {
      if($tagged_text->type == $type){
        $matching_elements[] = $tagged_text;
      }
    }
  }
  return $matching_elements;
}
(9-9/12)