
Commit 5865ed9

djtfmartin, charvolant, brucehyslop, matthewandrews, and sbearcsiro authored
Playbooks to support pipelines (#421)
* SOLR quoll updated to 8.6.0; flag for switching JTS version 'jts_use_1_16', see AtlasOfLivingAustralia/la-pipelines#108
* Checkpoint commit for the work on AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27; these scripts and inventories are a work in progress
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: fixes for SSH key creation and HDFS startup; additional 'pipelines' role for pipelines installation and additional setup of docker and SHP file resources; these scripts and inventories are a work in progress
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: fixes SHP file download
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: jenkins install and loading of jobs; removal of some config files after debian fixes
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: tags and additional spark env options
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: jenkins job definitions
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: override for inputPath for 'dataset-count-dump'
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: descriptions for datasetId property
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: script fixes to create HDFS directories and to move the docker directories off the root partition
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: added a check for an existing installation, skipping if HDFS data directories are already present, to avoid wiping existing HDFS installs
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: extra steps added to DWCA export job; fixes for hadoop slave config; AWS deployment for spark/hadoop
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: extra steps added to help set up jenkins master/slave
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: extra steps added to help set up jenkins jobs
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: private key locations and additional jenkins jobs
* Work for AtlasOfLivingAustralia/la-pipelines#77 and AtlasOfLivingAustralia/la-pipelines#27: zk_host value for quoll environment; dataset-archive-list config; adding hdfs tools to PATH
* Updates for jenkins jobs and collectory API keys
* aws-image-service-pipelines-test installation; updates to stored procedures (tied to changes on the image-service#pipelines-bulk-services branch); removed GC configuration (incompatible with openJDK); additional log files for image-service for indexing and batch service monitoring
* API key for image service
* Service installs for docker instances
* Set work DNS name to allow admin console navigation
* Update sensitive data service version
* No X here
* Additional local config
* Work for AtlasOfLivingAustralia/la-pipelines#232: separate master and name node for HDFS
* Work for AtlasOfLivingAustralia/la-pipelines#232: config for JackKnife; changed deprecated HDFS properties (e.g. dfs.data.dir) to the new versions
* Additions for clustering and solrcloud 8.8
* includeClustering typo
* Life stage vocab config
* Life stage vocab config fix and sampling config
* Use SNAPSHOT 3 version for biocache-service; additional config files required for field mapping; updated facts.json; SOLR 8.8.1
* Additional deprecated field mappings
* record_type, suitable_modelling mappings
* Mappings for IBRA, IMCRA
* Sort stateProvince by count by default (so that Aussie states float to the top)
* date_precision mapping
* Added mapping for occurrence_decade_i
* Additional deprecated mappings for fields noticed in configs
* Additional field mappings, see AtlasOfLivingAustralia/la-pipelines#308
* Removed the join for the export, as this was blocking the table export while image loading is happening; dwcaImportPath setting
* Mapping of rankID to taxonRankID for consistency with the taxonRank term; userAssertions field mapping
* assertionUserId mapping; enum mapping for deprecated month values
* Changes for biocache quoll to use namematching-ws-test.ala.org.au, and config changes for pipelines-field-config.json
* assertionUserId mapping
* Use http2; auth-test API keys; lastAssertionDate
* SOLR Cloud install for m6 servers; removal of GC options not compatible with Java 11; pipelines config changes; changes to add X-Request-ID tracking for nginx; groups.json; changes to biocache logging to reduce noise
* Fixes for AtlasOfLivingAustralia/la-pipelines#353
* Updated name matching docker image
* Updated name matching service docker image
* Cassandra 3 install for pipelines
* groups.json fixes
* ala-namematching-service:v20200214-15
* Reinstated output/heatmap directory
* Copy of pipelines config from biocache-service/config
* mulgara inventory and JTS 1.18.1
* Sync field mappings for AtlasOfLivingAustralia/la-pipelines#385
* Updated mapping from AtlasOfLivingAustralia/biocache-service#626
* Version 3.0.11-SNAPSHOT to biocache-test
* (minor) Remove nonprinting character
* jenkins role: update to new repo, support nginx
* AtlasOfLivingAustralia/la-pipelines#295: updated config field names to use pipelines fields
* Use http2 and solr_downloadquery_maxthreads=10
* biocache version bump and additional pipelines-field-config.json
* Mapping of Fish -> Fishes, to fix the SP Area report
* Content types facet
* Version 3.0.14 and use http2; increase in solr_connection_pool_size
* Docker image bump
* Include Bryophytes
* Plant as parent for Bryophytes
* image service: increased timeout
* solrcloud: add default for jts_use_1_18
* raw_name mapping and nameNotRecognised assertion mapping
* pipelines jenkins job updates
* More work to help set up the test environment
* Setting banners in SOLR; more work to help set up the test environment
* SDS configuration for the test environment
* NCI3 biocache set to use https://lists-test.ala.org.au; additional tags for convenience
* AtlasOfLivingAustralia/la-pipelines#479: sync of pipelines mapping from biocache-service
* tomcat/9_connector: last fix, works now; tomcat: add support for tomcat_max_post_size; tomcat9_connector: support for max_post_size; tomcat9_connector: another fix; tomcat_connector: add support for max_post_size
* solr.targetPath needed for dwca export
* Permission on java_home script and script approvals
* solr.in.sh fix and solr_version=8.9.0 for mulgara
* hadoop/spark/pipelines role fixes
* Fixes for the databox environment, including changing the jenkins port to avoid conflicts and ARM docker images; AtlasOfLivingAustralia/la-pipelines#519
* Fixes for the databox environment, including changing the jenkins port to avoid conflicts and ARM docker images; AtlasOfLivingAustralia/la-pipelines#519 and HA
* AtlasOfLivingAustralia/ala-infrastructure#847: added cron to purge biocache downloads greater than 180 days old
* Fix for dwca export
* AtlasOfLivingAustralia/ala-infrastructure#847: removed user for cron (defaults to root)
* Updates for image-service 1.1.0
* localsost -> localhost
* Work for AtlasOfLivingAustralia/la-pipelines#232: separate master and name node for HDFS
* Removed the join for the export, as this was blocking the table export while image loading is happening; dwcaImportPath setting
* SOLR Cloud install for m6 servers; removal of GC options not compatible with Java 11; pipelines config changes; changes to add X-Request-ID tracking for nginx; groups.json; changes to biocache logging to reduce noise
* Rebased with master and created separate copies of the biocache install to avoid breaking existing installs
* Following PR feedback

Co-authored-by: pal155 <Doug.Palmer@csiro.au>
Co-authored-by: Bruce Hyslop <bruce.hyslop@csiro.au>
Co-authored-by: Matt Andrews <Matt.Andrews@csiro.au>
Co-authored-by: Simon Bear <simon.bear@csiro.au>
1 parent 0bb66f0 commit 5865ed9

File tree

147 files changed: +9413 −48 lines

+9
@@ -0,0 +1,9 @@
+- hosts: biocache-service-clusterdb
+  roles:
+    - common
+    - java
+    - { role: tomcat, tomcat: tomcat9 }
+    - webserver
+    - biocache3-properties
+    - biocache3-service
+    - logger-client

ansible/hadoop.yml

+4
@@ -0,0 +1,4 @@
+- hosts: hadoop
+  roles:
+    - java
+    - hadoop

ansible/library/tomcat9_connector

+10 −2
@@ -33,6 +33,10 @@ options:
       - the port to use for connector
       - will use default port for protocol (8080 for HTTP or 8009 for AJP) if omitted
     required: false
+  max_post_size:
+    description:
+      - max size for a post request
+      - defaults to 2097152 (2MB)
   relaxed_query_chars:
     description:
       - A string containing the chars to relax to avoid requiring URL encoding
@@ -128,7 +132,7 @@ def default_port(name):
     return 8080 if name == "HTTP/1.1" else 8009


-def add_connector(aug, protocol, service, bind_addr, port, connection_timeout=20000, uri_encoding="UTF-8", redirect_port=443, relaxed_query_chars=""):
+def add_connector(aug, protocol, service, bind_addr, port, max_post_size, connection_timeout=20000, uri_encoding="UTF-8", redirect_port=443, relaxed_query_chars=""):

     aug.defvar("service", "/files/server.xml/Server/Service[#attribute/name=\"%(service)s\"]" % locals())

@@ -137,6 +141,8 @@ def add_connector(aug, protocol, service, bind_addr, port, connection_timeout=20

     aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/port" % locals(), str(port))

+    aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/maxPostSize" % locals(), str(max_post_size))
+
     aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/protocol" % locals(), protocol)

     aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/address" % locals(), bind_addr)
@@ -167,6 +173,7 @@ def main():
         bind_addr=dict(default="127.0.0.1"),
         relaxed_query_chars=dict(default=""),
         port=dict(type="int"),
+        max_post_size=dict(default=2097152, type="int"),
         connection_timeout=dict(default=20000, type="int"),
         uri_encoding=dict(default="UTF-8"),
         redirect_port=dict(default=443, type="int"),
@@ -185,6 +192,7 @@ def main():
     bind_addr = module.params["bind_addr"]
     relaxed_query_chars = module.params["relaxed_query_chars"]
     port = module.params["port"]
+    max_post_size = module.params["max_post_size"]
     connection_timeout = module.params["connection_timeout"]
     uri_encoding = module.params["uri_encoding"]
     redirect_port = module.params["redirect_port"]
@@ -209,7 +217,7 @@ def main():
     if state == "absent":
         remove_connector(aug, name, port)
     else:
-        add_connector(aug, name, service, bind_addr, port, connection_timeout, uri_encoding, redirect_port, relaxed_query_chars)
+        add_connector(aug, name, service, bind_addr, port, max_post_size, connection_timeout, uri_encoding, redirect_port, relaxed_query_chars)

     try:
         aug.save()

ansible/library/tomcat_connector

+10 −2
@@ -33,6 +33,10 @@ options:
       - the port to use for connector
      - will use default port for protocol (8080 for HTTP or 8009 for AJP) if omitted
     required: false
+  max_post_size:
+    description:
+      - max size for a post request
+      - defaults to 2097152 (2MB)
   relaxed_query_chars:
     description:
       - A string containing the chars to relax to avoid requiring URL encoding
@@ -128,7 +132,7 @@ def default_port(name):
     return 8080 if name == "HTTP/1.1" else 8009


-def add_connector(aug, protocol, service, bind_addr, port, connection_timeout=20000, uri_encoding="UTF-8", redirect_port=443, relaxed_query_chars=""):
+def add_connector(aug, protocol, service, bind_addr, port, max_post_size, connection_timeout=20000, uri_encoding="UTF-8", redirect_port=443, relaxed_query_chars=""):

     aug.defvar("service", "/files/server.xml/Server/Service[#attribute/name=\"%(service)s\"]" % locals())

@@ -137,6 +141,8 @@ def add_connector(aug, protocol, service, bind_addr, port, connection_timeout=20

     aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/port" % locals(), str(port))

+    aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/maxPostSize" % locals(), str(max_post_size))
+
     aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/protocol" % locals(), protocol)

     aug.set("$service/Connector[#attribute/port=\"%(port)s\"]/#attribute/address" % locals(), bind_addr)
@@ -168,6 +174,7 @@ def main():
         bind_addr=dict(default="127.0.0.1"),
         relaxed_query_chars=dict(default=""),
         port=dict(type="int"),
+        max_post_size=dict(default=2097152, type="int"),
         connection_timeout=dict(default=20000, type="int"),
         uri_encoding=dict(default="UTF-8"),
         redirect_port=dict(default=443, type="int"),
@@ -186,6 +193,7 @@ def main():
     bind_addr = module.params["bind_addr"]
     relaxed_query_chars = module.params["relaxed_query_chars"]
     port = module.params["port"]
+    max_post_size = module.params["max_post_size"]
     connection_timeout = module.params["connection_timeout"]
     uri_encoding = module.params["uri_encoding"]
     redirect_port = module.params["redirect_port"]
@@ -210,7 +218,7 @@ def main():
     if state == "absent":
         remove_connector(aug, name, port)
     else:
-        add_connector(aug, name, service, bind_addr, port, connection_timeout, uri_encoding, redirect_port, relaxed_query_chars)
+        add_connector(aug, name, service, bind_addr, port, max_post_size, connection_timeout, uri_encoding, redirect_port, relaxed_query_chars)

     try:
         aug.save()
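Both connector modules now accept a max_post_size parameter, written through Augeas to the Connector's maxPostSize attribute in server.xml. A minimal sketch of a playbook task using it follows; the name, service and state parameter names are inferred from the module's main() and add_connector() code above, and the values are illustrative, not taken from this commit:

- name: configure HTTP connector with a larger POST limit
  tomcat9_connector:
    name: HTTP/1.1            # connector protocol; inferred parameter name
    service: Catalina         # assumed Tomcat service name
    port: 8080
    max_post_size: 10485760   # bytes; the module default is 2097152 (2 MB)
    state: present

The same invocation should work with tomcat_connector for older Tomcat versions, since both modules expose an identical max_post_size parameter.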

ansible/pipelines.yml

+27
@@ -0,0 +1,27 @@
+- hosts: all
+  roles:
+    - java
+
+- hosts: all
+  roles:
+    - i18n
+
+- hosts: hadoop
+  roles:
+    - hadoop
+
+- hosts: spark
+  roles:
+    - spark
+
+- hosts: jenkins
+  roles:
+    - jenkins-simple
+
+- hosts: pipelines
+  roles:
+    - pipelines
+
+- hosts: pipelines_jenkins
+  roles:
+    - pipelines_jenkins
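This playbook assumes an inventory that defines the hadoop, spark, jenkins, pipelines and pipelines_jenkins groups (the java and i18n plays target all hosts). A minimal YAML inventory sketch with hypothetical hostnames, not part of this commit:

all:
  children:
    hadoop:
      hosts:
        hadoop-1.example.org:
    spark:
      hosts:
        spark-1.example.org:
    jenkins:
      hosts:
        jenkins-1.example.org:
    pipelines:
      hosts:
        pipelines-1.example.org:
    pipelines_jenkins:
      hosts:
        jenkins-1.example.org:   # hypothetical: same host reused for pipelines jenkins jobs

A host may belong to several groups; the hosts: all plays still run once per host regardless of group membership.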

ansible/roles/biocache-hub/templates/config/grouped_facets_ala.json

+5
@@ -233,6 +233,11 @@
       {
         "sort":"index",
         "field":"occurrence_status"
+      },
+      {
+        "sort": "index",
+        "description": "Content types",
+        "field": "contentTypes"
       }
     ]
   },
@@ -0,0 +1,122 @@
+/* Creates the cassandra 0.7.x schema necessary for biocache-store
+   Run this file using:
+   ./cassandra-cli --host localhost --batch < create_cass_schema.txt
+*/
+
+/* all keyspaces are created using the ByteOrderPreservingPartitioner see the cassandra.yaml file */
+create keyspace occ;
+
+use occ;
+
+create column family occ with comparator=UTF8Type and default_validation_class=UTF8Type
+    and comment='The column family for occurrence records'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy=LeveledCompactionStrategy
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and column_metadata=[{column_name: portalId, validation_class: UTF8Type, index_type: KEYS},
+                         {column_name: uuid, validation_class: UTF8Type, index_type: KEYS}];
+
+create column family loc with comparator=UTF8Type
+    and default_validation_class=UTF8Type
+    and key_validation_class = 'UTF8Type'
+    and comment='The column family for locations'
+    and compaction_strategy=LeveledCompactionStrategy
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'};
+
+create column family attr with comparator=UTF8Type
+    and default_validation_class=UTF8Type
+    and key_validation_class = 'UTF8Type'
+    and comment='The column family for attribution tracking'
+    and compaction_strategy=LeveledCompactionStrategy;
+
+create column family taxon with comparator=UTF8Type
+    and default_validation_class=UTF8Type
+    and key_validation_class = 'UTF8Type'
+    and comment='The column family for taxon profile information'
+    and compaction_strategy=LeveledCompactionStrategy
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'};
+
+
+/* update column family loc with comparator=UTF8Type and keys_cached=1.0 */
+
+create column family qa with comparator=UTF8Type
+    and default_validation_class=UTF8Type
+    and key_validation_class = 'UTF8Type'
+    and comment='The column family for quality assertions'
+    and column_metadata=[{column_name: userId, validation_class: UTF8Type, index_type: KEYS},
+                         {column_name: code, validation_class: UTF8Type, index_type: KEYS}]
+    and compaction_strategy=LeveledCompactionStrategy
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'};
+
+create column family dellog
+    with comparator = 'UTF8Type'
+    and default_validation_class = 'UTF8Type'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy = 'org.apache.cassandra.db.compaction.LeveledCompactionStrategy'
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and comment = 'The column family to log deleted information';
+
+create column family duplicates
+    with comparator = 'UTF8Type'
+    and default_validation_class = 'UTF8Type'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy = 'org.apache.cassandra.db.compaction.LeveledCompactionStrategy'
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and comment = 'The column family to store information about duplicates';
+
+create column family occ_duplicates
+    with comparator = 'UTF8Type'
+    and default_validation_class = 'UTF8Type'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy = 'org.apache.cassandra.db.compaction.LeveledCompactionStrategy'
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and comment = 'The column family to store information about duplicates';
+
+create column family upload
+    with comparator = 'UTF8Type'
+    and default_validation_class = 'UTF8Type'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy = 'org.apache.cassandra.db.compaction.LeveledCompactionStrategy'
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and comment = 'The column family to store information about dynamically uploaded datasets';
+
+create column family outliers with comparator = 'UTF8Type' and default_validation_class = 'UTF8Type'
+    and comment='The column family for occurrence records' and gc_grace=2000;
+
+create column family occ_outliers with comparator = 'UTF8Type' and default_validation_class = 'UTF8Type'
+    and comment='The column family for occurrence records' and gc_grace=2000;
+
+update column family outliers with comparator = 'UTF8Type' and default_validation_class = 'UTF8Type'
+    and column_metadata=[{column_name: portalId, validation_class: UTF8Type, index_type: KEYS},
+                         {column_name: uuid, validation_class: UTF8Type, index_type: KEYS}];
+
+update column family occ_outliers with comparator = 'UTF8Type' and default_validation_class = 'UTF8Type'
+    and column_metadata=[{column_name: portalId, validation_class: UTF8Type, index_type: KEYS},
+                         {column_name: uuid, validation_class: UTF8Type, index_type: KEYS}];
+
+
+create column family queryassert
+    with comparator = 'UTF8Type'
+    and default_validation_class = 'UTF8Type'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy = 'org.apache.cassandra.db.compaction.LeveledCompactionStrategy'
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and comment = 'The column family to store information about query based assertions';
+
+update column family queryassert with column_metadata=[{column_name: uuid, validation_class: UTF8Type, index_type: KEYS}];
+
+create column family distribution_outliers
+    with comparator = 'UTF8Type'
+    and default_validation_class = 'UTF8Type'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy = 'org.apache.cassandra.db.compaction.LeveledCompactionStrategy'
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and comment = 'The column family to store information about expert distribution outlier records';
+
+create column family qid
+    with comparator = 'UTF8Type'
+    and default_validation_class = 'UTF8Type'
+    and key_validation_class = 'UTF8Type'
+    and compaction_strategy = 'org.apache.cassandra.db.compaction.LeveledCompactionStrategy'
+    and compaction_strategy_options = {'sstable_size_in_mb' : '200'}
+    and comment = 'The column family to store information about stored query requests (qid)';
@@ -0,0 +1 @@
+CREATE KEYSPACE IF NOT EXISTS biocache WITH replication = {'class': 'SimpleStrategy', 'replication_factor': '2'} AND durable_writes = true;
@@ -0,0 +1,8 @@
+- name: restart cassandra
+  service: name=cassandra state=restarted enabled="yes"
+
+- name: configure cassandra
+  shell: 'cassandra-cli < /tmp/cassandra-schema.txt'
+
+- name: configure cassandra
+  shell: 'cqlsh < /tmp/cassandra3-schema.txt'
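These handlers run when notified by a task. A sketch, not part of this commit, of a task that uploads a refreshed schema and triggers the CQL handler:

- name: copy cassandra 3 schema
  copy:
    src: cassandra/cassandra3-schema.txt
    dest: /tmp/cassandra3-schema.txt
  notify: configure cassandra   # handlers run once at the end of the play

Note that two handlers above share the name 'configure cassandra'; since Ansible resolves notifications by name and a later definition shadows an earlier one with the same name, a notify here would reach only the last-defined (cqlsh) variant.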
+33
@@ -0,0 +1,33 @@
+- include: ../../common/tasks/setfacts.yml
+
+- name: disable swap
+  shell: "swapoff --all"
+  # This fails in LXC containers, see:
+  # https://bugs.launchpad.net/ubuntu/+source/lxc/+bug/930652
+  when: ansible_virtualization_type != 'lxc'
+  tags:
+    - biocache_db
+
+- name: copy transient files to tmp (schemas etc)
+  copy: src={{item}} dest=/tmp
+  with_items:
+    - cassandra/cassandra-schema.txt
+    - cassandra/cassandra3-schema.txt
+  tags:
+    - biocache_db
+
+- name: restart cassandra
+  service: name=cassandra state=restarted enabled="yes"
+  tags:
+    - biocache_db
+
+- name: ensure cassandra 1.x is running
+  wait_for: port=9160 delay=30
+  when: use_cassandra3 is not defined
+  tags:
+    - biocache_db
+
+- name: create schema (cassandra 3)
+  shell: "cqlsh < /tmp/cassandra3-schema.txt"
+  tags:
+    - biocache_db
