DatasetServiceImpl.java

/*
 * Copyright 2018 Global Crop Diversity Trust
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.genesys.server.service.impl;

import static org.genesys.server.model.dataset.QDataset.dataset;
import static org.genesys.server.model.dataset.QDatasetCreator.datasetCreator;

import java.io.BufferedOutputStream;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.OutputStream;
import java.nio.file.Path;
import java.nio.file.Paths;
import java.time.Instant;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collection;
import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Locale;
import java.util.Map;
import java.util.Objects;
import java.util.Set;
import java.util.TreeSet;
import java.util.UUID;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.stream.Collectors;

import javax.persistence.EntityManager;
import javax.persistence.PersistenceContext;

import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.StringUtils;
import org.genesys.blocks.security.model.AclSid;
import org.genesys.blocks.security.serialization.Permissions;
import org.genesys.blocks.security.service.CustomAclService;
import org.genesys.filerepository.FolderNotEmptyException;
import org.genesys.filerepository.InvalidRepositoryFileDataException;
import org.genesys.filerepository.InvalidRepositoryPathException;
import org.genesys.filerepository.NoSuchRepositoryFileException;
import org.genesys.filerepository.model.RepositoryFile;
import org.genesys.filerepository.model.RepositoryFolder;
import org.genesys.filerepository.service.RepositoryService;
import org.genesys.server.component.aspect.NotifyForReview;
import org.genesys.server.component.aspect.NotifyOnPublished;
import org.genesys.server.component.security.AsAdminInvoker;
import org.genesys.server.component.security.SecurityUtils;
import org.genesys.server.exception.InvalidApiUsageException;
import org.genesys.server.exception.NotFoundElement;
import org.genesys.server.exception.SearchException;
import org.genesys.server.model.Partner;
import org.genesys.server.model.PublishState;
import org.genesys.server.model.UserRole;
import org.genesys.server.model.dataset.Dataset;
import org.genesys.server.model.dataset.DatasetAccessionRef;
import org.genesys.server.model.dataset.DatasetCreator;
import org.genesys.server.model.dataset.DatasetLang;
import org.genesys.server.model.dataset.DatasetLocation;
import org.genesys.server.model.dataset.DatasetVersions;
import org.genesys.server.model.dataset.QDataset;
import org.genesys.server.model.dataset.QDatasetAccessionRef;
import org.genesys.server.model.filters.DatasetFilter;
import org.genesys.server.model.genesys.Accession;
import org.genesys.server.model.genesys.QAccession;
import org.genesys.server.model.impl.FaoInstitute;
import org.genesys.server.model.traits.Descriptor;
import org.genesys.server.model.traits.QDescriptor;
import org.genesys.server.persistence.DatasetLangRepository;
import org.genesys.server.persistence.dataset.DatasetAccessionRefRepository;
import org.genesys.server.persistence.dataset.DatasetCreatorRepository;
import org.genesys.server.persistence.dataset.DatasetLocationRepository;
import org.genesys.server.persistence.dataset.DatasetRepository;
import org.genesys.server.persistence.dataset.DatasetVersionsRepository;
import org.genesys.server.persistence.traits.DescriptorRepository;
import org.genesys.server.service.AmphibianService;
import org.genesys.server.service.DatasetService;
import org.genesys.server.service.DatasetTranslationService;
import org.genesys.server.service.DescriptorService;
import org.genesys.server.service.DescriptorTranslationService;
import org.genesys.server.service.DownloadService;
import org.genesys.server.service.ElasticsearchService;
import org.genesys.server.service.TranslatorService;
import org.genesys.server.service.TranslatorService.FormattedText;
import org.genesys.server.service.TranslatorService.TextFormat;
import org.genesys.server.service.VersionManager;
import org.genesys.server.service.filter.AccessionFilter;
import org.genesys.server.service.worker.AccessionRefMatcher;
import org.genesys.util.JPAUtils;
import org.genesys.util.LoggerHelper;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.beans.factory.annotation.Value;
import org.springframework.cache.annotation.CacheEvict;
import org.springframework.cache.annotation.Cacheable;
import org.springframework.context.annotation.Lazy;
import org.springframework.core.task.TaskExecutor;
import org.springframework.dao.ConcurrencyFailureException;
import org.springframework.data.domain.Page;
import org.springframework.data.domain.PageImpl;
import org.springframework.data.domain.PageRequest;
import org.springframework.data.domain.Pageable;
import org.springframework.data.domain.Sort;
import org.springframework.data.jpa.repository.support.Querydsl;
import org.springframework.security.access.prepost.PostAuthorize;
import org.springframework.security.access.prepost.PreAuthorize;
import org.springframework.security.acls.domain.BasePermission;
import org.springframework.stereotype.Component;
import org.springframework.stereotype.Service;
import org.springframework.transaction.annotation.Isolation;
import org.springframework.transaction.annotation.Propagation;
import org.springframework.transaction.annotation.Transactional;
import org.springframework.validation.annotation.Validated;
import org.springframework.web.multipart.MultipartFile;

import com.google.common.collect.Lists;
import com.google.common.collect.Sets;
import com.querydsl.core.BooleanBuilder;
import com.querydsl.core.types.Predicate;
import com.querydsl.core.types.dsl.PathBuilder;
import com.querydsl.core.types.dsl.PathBuilderFactory;
import com.querydsl.jpa.JPAExpressions;
import com.querydsl.jpa.JPQLQuery;
import com.querydsl.jpa.impl.JPAQueryFactory;
import com.vdurmont.semver4j.SemverException;

import lombok.extern.slf4j.Slf4j;

/**
 * The Class DatasetServiceImpl.
 */
@Service
@Transactional(readOnly = true)
@Validated
@Slf4j
public class DatasetServiceImpl  extends FilteredTranslatedCRUDServiceImpl<
	Dataset, DatasetLang, DatasetTranslationService.TranslatedDataset, DatasetFilter, DatasetRepository>
	implements DatasetService {

	/** The dataset versions repository. */
	@Autowired
	private DatasetVersionsRepository datasetVersionsRepository;

	/** The dataset creator repository. */
	@Autowired
	private DatasetCreatorRepository datasetCreatorRepository;

	/** The location repository. */
	@Autowired
	private DatasetLocationRepository locationRepository;

	@Autowired
	private DatasetAccessionRefRepository accessionRefRepository;

	/** The file repo service. */
	@Autowired
	private RepositoryService repositoryService;

	@Autowired
	private CustomAclService aclService;

	/** The securityUtils. */
	@Autowired
	private SecurityUtils securityUtils;

	/** Execute code as admin */
	@Autowired
	protected AsAdminInvoker asAdminInvoker;

	/** The download service. */
	@Autowired
	private DownloadService downloadService;

	/** The descriptor service. */
	@Autowired
	private DescriptorService descriptorService;

	/** The descriptor repository. */
	@Autowired
	private DescriptorRepository descriptorRepository;

	/** The file repository path. */
	@Value("${file.repository.datasets.folder}")
	public String datasetRepositoryPath;

	@Autowired
	private TaskExecutor taskExecutor;

	@Autowired
	private AccessionRefMatcher accessionRefMatcher;

	@PersistenceContext
	private EntityManager entityManager;

	@Autowired
	private VersionManager versionManager;

	@Autowired(required = false)
	private ElasticsearchService elasticsearchService;

	@Autowired
	private JPAQueryFactory jpaQueryFactory;

	@Autowired
	@Lazy
	private AmphibianService amphibianService;

	private Comparator<DatasetAccessionRef> distinctAcceRefsComparator;

	@Autowired
	private DescriptorTranslationService descriptorTranslationService;

	@Autowired(required = false)
	private TranslatorService translatorService;

	@Override
	public void afterPropertiesSet() throws Exception {
		distinctAcceRefsComparator = Comparator
			.comparing((DatasetAccessionRef ref) -> ref.getDataset().getId())
			.thenComparing(DatasetAccessionRef::getInstCode)
			.thenComparing(DatasetAccessionRef::getGenus)
			.thenComparing(DatasetAccessionRef::getAcceNumb);
	}

	@Component(value = "DatasetTranslationSupport")
	protected static class DatasetTranslationSupport
		extends BaseTranslationSupport<
		Dataset, DatasetLang, DatasetTranslationService.TranslatedDataset, DatasetFilter, DatasetLangRepository>
		implements DatasetTranslationService {

		@Override
		@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#source.entity, 'write')")
		public DatasetLang create(DatasetLang source) {
			return super.create(source);
		}

		@Override
		@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#target.entity, 'write')")
		public DatasetLang update(DatasetLang updated, DatasetLang target) {
			return super.update(updated, target);
		}

		@Override
		@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#source.entity, 'write')")
		public DatasetLang remove(DatasetLang source) {
			return super.remove(source);
		}
	}

	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#source.owner, 'write')")
	public Dataset createFast(Dataset source) {
		return create(source);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#source.owner, 'write')")
	public Dataset create(final Dataset source) {
		log.info("Create Dataset. Input data {}", source);
		final DatasetVersions datasetVersions = new DatasetVersions();
		datasetVersions.setCurrentVersion(null);
		datasetVersionsRepository.save(datasetVersions);

		Dataset dataset = new Dataset();
		dataset.setUuid(source.getUuid());
		dataset.setVersions(datasetVersions);
		dataset.setCurrent(null);
		copyValues(dataset, source);
		dataset.setState(PublishState.DRAFT);
		dataset.setOwner(source.getOwner());
		dataset.setVersionTag(source.getVersionTag());
		dataset.setDescriptors(new ArrayList<>());
		dataset.setRepositoryFiles(new ArrayList<>());
		dataset.setCreators(new ArrayList<>());
		dataset.setLocations(new ArrayList<>());
		dataset.setCrops(source.getCrops());
		dataset.setOriginalLanguageTag(source.getOriginalLanguageTag());

		copyDescriptors(dataset, source.getDescriptors());

		dataset = repository.save(dataset);

		// Make dataset publicly not-readable
		aclService.makePubliclyReadable(dataset, false);

		// Make dataset folder
		ensureDatasetFolder(dataset);

		// Grant all permissions to the Partner's SID
		final AclSid sid = aclService.ensureAuthoritySid(dataset.getOwner().getAuthorityName());
		aclService.setPermissions(dataset, sid, new Permissions().grantAll());

		return dataset;
	}

	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#target, 'write')")
	public Dataset update(Dataset updated, Dataset target) {
		copyValues(target, updated);
		target.setState(PublishState.DRAFT);

		return lazyLoad(repository.save(target));
	}

	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR')")
	public Dataset forceUpdate(Dataset updated) {
		var target = get(updated.getId());
		log.info("Force update Dataset. Input data {}", updated);

		if (updated.getOwner() != null && !target.getOwner().getUuid().equals(updated.getOwner().getUuid())) {
			throw new InvalidApiUsageException("Dataset owner can't be changed");
		}
		copyValues(target, updated);

		return repository.save(target);
	}

	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#target, 'write')")
	public Dataset updateFast(Dataset updated, Dataset target) {
		target = getUnpublishedDataset(target);
		log.info("Update Dataset. Input data {}", updated);

		if (updated.getOwner() != null && !target.getOwner().equals(updated.getOwner())) {
			throw new InvalidApiUsageException("Dataset owner can't be changed");
		}
		copyValues(target, updated);
		target.setState(PublishState.DRAFT);

		return repository.save(target);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#input, 'write')")
	public Dataset update(final Dataset input) {
		final Dataset dataset = getUnpublishedDataset(input);
		log.info("Update Dataset. Input data {}", input);

		if (input.getOwner() != null && !dataset.getOwner().equals(input.getOwner())) {
			throw new InvalidApiUsageException("Dataset owner can't be changed");
		}

		return update(input, dataset);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset setAccessionRefs(Dataset dataset, final Collection<DatasetAccessionRef> accessionRefs) {
		dataset = getUnpublishedDataset(dataset);
		log.info("Set accessions to Dataset {}. Input accessions {}", dataset.getUuid(), accessionRefs.size());

		deleteAccessionRefs(dataset);
		return addAccessionRefs(dataset, accessionRefs);
	}

	private void deleteAccessionRefs(Dataset dataset) {
		var removed = accessionRefRepository.deleteByList(dataset);
		log.warn("Removed {} accessionRefs from Dataset {}", removed, dataset.getUuid());
		dataset.getAccessionRefs().clear();
		log.warn("Cleared Dataset list");
		dataset.setAccessionCount(0);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public Dataset addDescriptors(Dataset dataset, final Descriptor... descriptors) {
		dataset = getUnpublishedDataset(dataset);

		log.info("Add descriptor to Dataset {}. Input descriptors {}", dataset, descriptors);
		final Set<UUID> descriptorUuids = dataset.getDescriptors().stream().map(descriptor -> descriptor.getUuid()).collect(Collectors.toSet());

		for (final Descriptor inputDescriptor : descriptors) {
			if (descriptorUuids.contains(inputDescriptor.getUuid())) {
				log.warn("Current Dataset already contains descriptor, ignoring");
			} else {
				dataset.getDescriptors().add(inputDescriptor);
				descriptorUuids.add(inputDescriptor.getUuid());
			}
		}
		// System.err.println("Processing done.");
		dataset = repository.save(dataset);
		// System.err.println("Saving done.");
		dataset = lazyLoad(dataset);
		// System.err.println("Lazy loading done.");
		return dataset;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public Dataset removeDescriptors(Dataset dataset, final Descriptor... descriptorsToRemove) {
		dataset = getUnpublishedDataset(dataset);
		log.info("Remove descriptors {} of dataset {}.", descriptorsToRemove, dataset);

		// Which UUIDs to remove?
		final Set<UUID> descriptorUuids = Arrays.stream(descriptorsToRemove).map(descriptor -> descriptor.getUuid()).collect(Collectors.toSet());

		// Keep descriptors that are not in the list
		dataset.setDescriptors(dataset.getDescriptors().stream().filter(descriptor -> !descriptorUuids.contains(descriptor.getUuid())).collect(Collectors.toList()));

		removeAmphibianObservations(dataset, List.of(descriptorsToRemove));

		return lazyLoad(repository.save(dataset));
	}

	private void removeAmphibianObservations(Dataset dataset, final Collection<Descriptor> descriptors) {
		if (CollectionUtils.isEmpty(descriptors)) return;
		if (amphibianService != null) {
			for (var descriptor : descriptors) {
				try {
					amphibianService.removeObservations(dataset, descriptor);
				} catch (Throwable e) {
					log.warn("Could not remove observations for {} from Amphibian dataset {}: {}", descriptor, dataset, e.getMessage());
				}
			}
		}
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public Dataset updateDescriptors(Dataset dataset, final List<Descriptor> descriptors) {
		dataset = getUnpublishedDataset(dataset);
		log.info("Update descriptors for Dataset {}. Input descriptors {}", dataset, descriptors);

		var removedDescriptors = dataset.getDescriptors().stream().filter(d -> !descriptors.contains(d)).collect(Collectors.toList());
		log.warn("Removed descriptors: {}", removedDescriptors);
		removeAmphibianObservations(dataset, removedDescriptors);

		dataset.getDescriptors().clear();
		copyDescriptors(dataset, descriptors);

		return lazyLoad(repository.save(dataset));
	}

	@Override
	@PostAuthorize("returnObject==null || returnObject.published || hasRole('ADMINISTRATOR') || hasPermission(returnObject, 'read')")
	public Dataset getDataset(UUID uuid) {
		return repository.findByUuid(uuid);
	}

	@Override
	@PostAuthorize("returnObject==null || returnObject.published || hasRole('ADMINISTRATOR') || hasPermission(returnObject, 'read')")
	public Dataset getDataset(UUID uuid, Integer version) {
		final Dataset dataset = repository.findByUuid(uuid);

		if (dataset == null) {
			throw new NotFoundElement("Record not found by uuid=" + uuid);
		}

		if (version != null && !dataset.getVersion().equals(version)) {
			log.warn("Dataset versions don't match anymore");
			throw new ConcurrencyFailureException("Object version changed to " + dataset.getVersion() + ", you provided " + version);
		}
		return dataset;
	}

	@Override
	public void writeXlsxMCPD(Dataset dataset, OutputStream outputStream) throws IOException {
		PathBuilder<Accession> builder = new PathBuilderFactory().create(Accession.class);
		Querydsl querydsl = new Querydsl(entityManager, builder);
		JPQLQuery<Long> queryAccessionId = querydsl.createQuery(QDatasetAccessionRef.datasetAccessionRef)
			// select id only
			.select(QDatasetAccessionRef.datasetAccessionRef.accession().id)
			// order by id
			.orderBy(QDatasetAccessionRef.datasetAccessionRef.accession().id.asc());

		// Apply where
		queryAccessionId.where(QDatasetAccessionRef.datasetAccessionRef.list().eq(dataset));

		downloadService.writeXlsxMCPD(queryAccessionId, outputStream, "", "/datasets/" + dataset.getUuid());
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("(hasRole('ADMINISTRATOR') || hasPermission(#source, 'write')) && #source.published")
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset createNewVersion(Dataset source) {
		source = getDataset(source);

		final Dataset dataset = new Dataset();
		copyValues(dataset, source);
		try {
			dataset.setVersionTag(versionManager.nextMajor(source.getVersionTag()));
		} catch (SemverException e) {
			dataset.setVersionTag(source.getVersionTag() + ".1");
		}
		dataset.setState(PublishState.DRAFT);
		dataset.setCurrent(null);
		dataset.setUuid(null);
		dataset.setVersions(source.getVersions());

		// Copy descriptors
		dataset.setDescriptors(new ArrayList<>());
		copyDescriptors(dataset, source.getDescriptors());

		Dataset saved = repository.save(dataset);

		// copy accessionRefs
		saved = copyAccessionRefs(saved, source.getAccessionRefs());

		// Copy creators
		copyCreators(saved, source.getCreators());

		// Copy locations
		copyLocations(saved, source.getLocations());

		saved.setCurrentVersion(source.getUuid());

		// Make dataset publicly not-readable
		aclService.makePubliclyReadable(saved, false);

		// Make dataset folder
		ensureDatasetFolder(saved);

		return saved;
	}

	/**
	 * Copy and save dataset accessionRefs.
	 *
	 * @param target the target
	 * @param accessionRefs the dataset accessionRefs
	 * @return
	 */
	private Dataset copyAccessionRefs(final Dataset target, final List<DatasetAccessionRef> accessionRefs) {
		if (accessionRefs == null || accessionRefs.size() == 0) {
			return target;
		}

		Dataset loadedDataset = getDataset(target);
		List<DatasetAccessionRef> copiedAccessionRefs = Lists.newArrayList();
		getDistinctAccessionRefs(accessionRefs).forEach(dAccessionRef -> {
			DatasetAccessionRef copy = new DatasetAccessionRef();
			copyAccessionRef(copy, dAccessionRef);
			copy.setDataset(loadedDataset);
			copiedAccessionRefs.add(copy);
		});

		accessionRefRepository.saveAll(copiedAccessionRefs);

		loadedDataset.setAccessionCount((int) accessionRefRepository.countByList(loadedDataset));
		log.info("Done saving {} accession refs, have {} in dataset", accessionRefs.size(), loadedDataset.getAccessionCount());
		return repository.save(loadedDataset);
	}

	/**
	 * Copy and save dataset locations.
	 *
	 * @param target the target
	 * @param locations the dataset locations
	 */
	private void copyLocations(final Dataset target, final List<DatasetLocation> locations) {
		if (locations == null || locations.size() == 0) {
			return;
		}

		List<DatasetLocation> copiedLocations = Lists.newArrayList();
		locations.forEach(location -> {
			DatasetLocation copy = new DatasetLocation();
			copyLocation(copy, location);
			copy.setDataset(target);
			copiedLocations.add(copy);
		});
		target.setLocations(locationRepository.saveAll(copiedLocations));
	}

	/**
	 * Copy and save dataset creators.
	 *
	 * @param target the target
	 * @param creators the dataset creators
	 */
	private void copyCreators(final Dataset target, final List<DatasetCreator> creators) {
		if (creators == null || creators.size() == 0) {
			return;
		}

		List<DatasetCreator> copiedCreators = Lists.newArrayList();
		creators.forEach(creator -> {
			DatasetCreator copy = new DatasetCreator();
			copyCreator(copy, creator);
			copy.setDataset(target);
			copiedCreators.add(copy);
		});
		target.setCreators(datasetCreatorRepository.saveAll(copiedCreators));
	}

	private RepositoryFolder ensureDatasetFolder(final Dataset dataset) {
		try {
			final Path datasetPath = Paths.get(datasetRepositoryPath, dataset.getUuid().toString());

			// Ensure folder ownership
			return asAdminInvoker.invoke(() -> {
				// Ensure target folder exists for the Dataset
				return repositoryService.ensureFolder(datasetPath, dataset);
			});

		} catch (Exception e) {
			log.warn("Could not create folder: {}", e.getMessage());
			throw new InvalidApiUsageException("Could not create folder", e);
		}
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@PostAuthorize("hasRole('ADMINISTRATOR') || returnObject==null || returnObject.isPublished() || hasPermission(returnObject, 'read')")
	public Dataset loadDataset(final Dataset input) {
		final Dataset dataset = getDataset(input);
		return lazyLoad(dataset);
	}

	private Dataset getDataset(final Dataset input) {
		log.debug("Load Dataset. Input data {}", input);
		final Dataset dataset = repository.findById(input.getId()).orElse(null);

		if (dataset == null) {
			throw new NotFoundElement("Record not found by id=" + input.getId());
		}

		if (!dataset.getVersion().equals(input.getVersion())) {
			log.warn("Dataset versions don't match anymore");
			throw new ConcurrencyFailureException("Object version changed to " + dataset.getVersion() + ", you provided " + input.getVersion());
		}
		return dataset;
	}

	private Dataset getUnpublishedDataset(final Dataset input) {
		Dataset loadedDataset = getDataset(input);
		if (loadedDataset.isPublished()) {
			throw new InvalidApiUsageException("Cannot modify a published Dataset.");
		}
		return loadedDataset;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public Page<Dataset> list(final DatasetFilter filter, final Pageable page) throws SearchException {
		final BooleanBuilder published = new BooleanBuilder();
		published.and(QDataset.dataset.state.eq(PublishState.PUBLISHED).and(QDataset.dataset.current.isTrue()));
		Page<Dataset> res;
		final Pageable markdownSortPageRequest = JPAUtils.toMarkdownSort(page, "title");

		if (filter.isFulltextQuery()) {
			res = elasticsearchService.findAll(Dataset.class, filter, published, markdownSortPageRequest);
		} else {
			res = repository.findAll(published.and(filter.buildPredicate()), markdownSortPageRequest);
		}
		return new PageImpl<>(res.getContent(), page, res.getTotalElements());
	}

	@Override
	@Transactional(readOnly = true)
	public Page<DatasetTranslationService.TranslatedDataset> listTranslated(final DatasetFilter filter, final Pageable page) throws SearchException {
		var datasetPage = list(filter, page);
		var translatedDatasets = translationSupport.getTranslated(datasetPage.getContent());
		return new PageImpl<>(translatedDatasets, page, datasetPage.getTotalElements());
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public Map<String, ElasticsearchService.TermResult> getSuggestions(DatasetFilter filter) throws SearchException, IOException {
		assert (filter != null);

		Set<String> suggestions = Sets.newHashSet("crops");
		Map<String, ElasticsearchService.TermResult> suggestionRes = new HashMap<>(suggestions.size());

		if (elasticsearchService == null) {
			return suggestionRes; // If we don't have ES, then suggest nothing
		}

		for (String suggestionKey : suggestions) {
			DatasetFilter suggestionFilter = filter.copy(DatasetFilter.class);
			suggestionFilter.state(PublishState.PUBLISHED);
			try {
				suggestionFilter.clearFilter(suggestionKey);
			} catch (NoSuchFieldException | IllegalAccessException e) {
				log.error("Error while clearing filter: ", e.getMessage());
			}
			suggestionFilter.current(true);
			ElasticsearchService.TermResult suggestion = elasticsearchService.termStatisticsAuto(Dataset.class, suggestionFilter, 100, suggestionKey);
			suggestionRes.put(suggestionKey, suggestion);
		}
		return suggestionRes;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public long countDatasets(DatasetFilter filter) throws SearchException {
		if (filter.isFulltextQuery()) {
			return elasticsearchService.count(Dataset.class, filter);
		}
		return repository.count(filter.buildPredicate());
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public Page<Dataset> listDatasetsForCurrentUser(final DatasetFilter filter, final Pageable page) throws SearchException {
		final Pageable markdownSortPageRequest = JPAUtils.toMarkdownSort(page, "title");
		Page<Dataset> res;
		if (securityUtils.hasRole(UserRole.ADMINISTRATOR)) {
			if (filter.isFulltextQuery()) {
				res = elasticsearchService.findAll(Dataset.class, filter, markdownSortPageRequest);
			} else {
				res = repository.findAll(filter.buildPredicate(), markdownSortPageRequest);
			}
		} else {
			final HashSet<Long> partners = new HashSet<>(securityUtils.listObjectIdentityIdsForCurrentUser(Partner.class, BasePermission.WRITE));
			if (filter.isFulltextQuery()) {
				res = elasticsearchService.findAll(Dataset.class, filter, dataset.owner().id.in(partners), markdownSortPageRequest);
			} else {
				res = repository.findAll(dataset.owner().id.in(partners).and(filter.buildPredicate()), markdownSortPageRequest);
			}
		}
		return new PageImpl<>(res.getContent(), page, res.getTotalElements());
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public Page<Dataset> loadCurrentVersionList(final Pageable page) {
		return repository.listAllCurrentVersion(page);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@PostAuthorize("hasRole('ADMINISTRATOR') || returnObject==null || returnObject.isPublished() || hasPermission(returnObject, 'read')")
	public Dataset loadDataset(final UUID uuid) {
		final Dataset dataset = repository.findByUuid(uuid);
		return lazyLoad(dataset);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@PostAuthorize("hasRole('ADMINISTRATOR') || returnObject==null || returnObject.entity.isPublished() || hasPermission(returnObject.entity, 'read')")
	public DatasetTranslationService.TranslatedDataset loadTranslatedDataset(final UUID uuid) {
		final Dataset dataset = repository.findByUuid(uuid);
		if (dataset == null) {
			throw new NotFoundElement("No such dataset");
		}
		var translatedDataset = translationSupport.getTranslated(dataset);
		translatedDataset.setDescriptors(descriptorTranslationService.getTranslated(translatedDataset.getEntity().getDescriptors()));
		return translatedDataset;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@PostAuthorize("hasRole('ADMINISTRATOR') || returnObject==null || returnObject.isPublished() || hasPermission(returnObject, 'read')")
	public Dataset loadDataset(final UUID uuid, final int version) {
		final Dataset dataset = repository.findByUuidAndVersion(uuid, version);
		return lazyLoad(dataset);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') || #dataset.published || hasPermission(#dataset, 'read')")
	public Page<DatasetAccessionRef> listAccessions(Dataset dataset, final Pageable page) {
		dataset = repository.findByUuid(dataset.getUuid());

		return accessionRefRepository.findByList(dataset, page);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public List<Dataset> listByAccession(final Accession accession) {
		final Iterable<Dataset> datasets = repository.findAll(dataset.accessionRefs.any().accession().eq(accession).and(dataset.state.in(PublishState.PUBLISHED).and(dataset.current.isTrue())));
		return Lists.newArrayList(datasets);
	}

	/**
	 * {@inheritDoc}
	 */
	@Transactional
	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public Dataset addDatasetFile(Dataset dataset, final MultipartFile file) throws NotFoundElement, IOException, InvalidRepositoryPathException,
			InvalidRepositoryFileDataException {
		dataset = getUnpublishedDataset(dataset);

		final RepositoryFile repositoryFile = repositoryService.addFile(getDatasetRepositoryFolder(dataset), file.getOriginalFilename(), file.getContentType(), file.getInputStream(), null);

		dataset.getRepositoryFiles().add(repositoryFile);
		return lazyLoad(repository.save(dataset));
	}

	@Override
	public Path getDatasetRepositoryFolder(Dataset dataset) {
		assert (dataset != null);
		assert (dataset.getUuid() != null);

		return Paths.get(datasetRepositoryPath, dataset.getUuid().toString()).toAbsolutePath();
	}

	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public Dataset updateDatasetFile(Dataset dataset, final RepositoryFile metadata) throws NoSuchRepositoryFileException {
		dataset = getUnpublishedDataset(dataset);

		final RepositoryFile datasetFile = dataset.getRepositoryFiles().stream().filter(df -> df.getUuid().equals(metadata.getUuid()) && df.getVersion().equals(metadata
			.getVersion())).findFirst().orElse(null);
		if (datasetFile == null) {
			throw new NotFoundElement("No such dataset file");
		}
		final RepositoryFile updated = repositoryService.updateMetadata(metadata);
		// replace it
		dataset.getRepositoryFiles().replaceAll(df -> df.getUuid().equals(datasetFile.getUuid()) ? updated : df);
		return lazyLoad(dataset);
	}

	/**
	 * {@inheritDoc}
	 */
	@Transactional
	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public Dataset removeDatasetFile(Dataset dataset, final UUID fileUuid) throws NotFoundElement, NoSuchRepositoryFileException, IOException {
		dataset = getUnpublishedDataset(dataset);

		final RepositoryFile repositoryFile = repositoryService.getFile(fileUuid);
		dataset.setRepositoryFiles(dataset.getRepositoryFiles().stream().filter(file -> !file.getUuid().equals(fileUuid)).collect(Collectors.toList()));
		repositoryService.removeFile(repositoryFile);
		return lazyLoad(repository.save(dataset));
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@PreAuthorize("#dataset.isPublished() || hasRole('ADMINISTRATOR') || hasPermission(#dataset, 'read')")
	public List<RepositoryFile> listDatasetFiles(final Dataset dataset) throws NotFoundElement {
		var loaded = reload(dataset);
		loaded.getRepositoryFiles().size();
		return loaded.getRepositoryFiles();
	}

	/**
	 * Deep load dataset data.
	 *
	 * @param dataset dataset to deepload
	 * @return fully loaded dataset
	 */
	private Dataset lazyLoad(final Dataset dataset) {
		if (dataset == null) {
			throw new NotFoundElement("No such dataset");
		}

		if (dataset.getDescriptors() != null) {
			dataset.getDescriptors().size();
		}
		if (dataset.getVersions() != null && dataset.getVersions().getAllVersions() != null) {
			dataset.getVersions().getAllVersions().size();
		}
		if (dataset.getRepositoryFiles() != null) {
			dataset.getRepositoryFiles().size();
		}
		if (dataset.getCreators() != null) {
			dataset.getCreators().size();
		}
		if (dataset.getLocations() != null) {
			dataset.getLocations().size();
		}
		if (dataset.getCrops() != null) {
			dataset.getCrops().size();
		}
		return dataset;
	}

	/**
	 * {@inheritDoc}
	 */
	@Transactional
	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'delete')")
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset remove(final Dataset dataset) {
		final Dataset loadedDataset = getUnpublishedDataset(dataset);

		deleteAccessionRefs(loadedDataset);

		var files = List.copyOf(loadedDataset.getRepositoryFiles());
		loadedDataset.getRepositoryFiles().clear();
		entityManager.flush();

		for (RepositoryFile repositoryFile : files) {
			try {
				repositoryService.removeFile(repositoryFile);
			} catch (NoSuchRepositoryFileException | IOException e) {
				log.warn("Could not delete file {} from dataset {}", repositoryFile.getUuid(), dataset.getUuid());
			}
		}
		entityManager.flush();

		try {
			repositoryService.deleteFolder(getDatasetRepositoryFolder(dataset));
		} catch (InvalidRepositoryPathException | FolderNotEmptyException e) {
			log.warn("Could not delete folder {} from dataset {}: {}", getDatasetRepositoryFolder(dataset), dataset.getUuid(), e.getMessage());
		}

		repository.delete(loadedDataset);

		if (amphibianService != null) {
			try {
				amphibianService.removeDataset(loadedDataset);
			} catch (Throwable e) {
				log.warn("Could not remove Amphibian dataset {}: {}", loadedDataset, e.getMessage(), e);
			}
		}
		return loadedDataset;
	}

	/**
	 * {@inheritDoc}
	 */
	@Transactional
	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset addAccessionRefs(final Dataset dataset, final Collection<DatasetAccessionRef> accessionRefs) throws NotFoundElement {
		final Dataset loadedDataset = getUnpublishedDataset(dataset.getUuid());

		final var existingRefCount = accessionRefRepository.countByList(loadedDataset);
		log.warn("Adding {} accession references to Dataset that now has {} refs.", accessionRefs.size(), existingRefCount);

		accessionRefs.forEach(ref -> ref.setDataset(loadedDataset)); // So that #equals works
		Lists.partition(new ArrayList<>(getDistinctAccessionRefs(accessionRefs)), 10000).stream().forEach(batch -> {
			List<DatasetAccessionRef> updatedRefs;
			if (existingRefCount == 0) {
				updatedRefs = accessionRefRepository.saveAllAndFlush(batch);
				log.warn("Added new {} accession references to Dataset.", updatedRefs.size());
			} else {
				updatedRefs = accessionRefRepository.findExisting(loadedDataset, batch);
				updatedRefs = accessionRefRepository.saveAllAndFlush(updatedRefs);
				log.info("Stored {} accession references to Dataset.", batch.size());
			}
			// Rematching is done in AccessionRefAspect!
		});

		loadedDataset.setAccessionCount(accessionRefRepository.countByList(loadedDataset));
		final var updatedDataset = repository.save(loadedDataset);
		log.info("Done saving {} accession refs to dataset {} has count={}", accessionRefs.size(), updatedDataset.getUuid(), updatedDataset.getAccessionCount());
		return lazyLoad(updatedDataset);
	}

	private Dataset getUnpublishedDataset(UUID uuid) {
		Dataset loadedDataset = repository.findByUuid(uuid);
		if (loadedDataset == null) {
			throw new NotFoundElement("Record not found by UUID=" + uuid);
		}
		if (loadedDataset.isPublished()) {
			throw new InvalidApiUsageException("Cannot modify a published Dataset.");
		}
		return loadedDataset;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR')")
	@NotifyOnPublished
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset approveDataset(final Dataset dataset) {
		Dataset loaded = getUnpublishedDataset(dataset);

		if (loaded.getState() == PublishState.DRAFT) {
			throw new InvalidApiUsageException("Dataset should be sent for review before publication");
		}

		for (final Descriptor descriptor : loaded.getDescriptors()) {
			if (descriptor.getState() != PublishState.PUBLISHED) {
				log.info("Publishing descriptor {}", descriptor);
				try {
					descriptorService.approveDescriptor(descriptor);
				} catch (InvalidApiUsageException e) {
					throw e;
				}
			}
		}

		loaded.setState(PublishState.PUBLISHED);

		// generate file with metadata and add it to the dataset
		try {
			File tempFile = File.createTempFile("dataset-", ".xlsx");
			try (final OutputStream bos = new BufferedOutputStream(new FileOutputStream(tempFile, false), 8 * 1000)) {
				downloadService.writeXlsxDataset(loaded, bos);

				final String fileName = "Metadata.xlsx";
				final String contentType = "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet";
				try {
					final RepositoryFile datasetFile = repositoryService.getFile(Paths.get(datasetRepositoryPath, loaded.getUuid().toString()), fileName);
					repositoryService.updateBytes(datasetFile, contentType, tempFile);
				} catch (final NoSuchRepositoryFileException | InvalidRepositoryPathException e) {
					try {
						RepositoryFile metadata = new RepositoryFile();
						metadata.setTitle("Dataset metadata");
						metadata.setDescription("Auto-generated by Genesys");
						final RepositoryFile addedFile = repositoryService.addFile(getDatasetRepositoryFolder(loaded), fileName, contentType, tempFile, metadata);
						loaded.getRepositoryFiles().add(addedFile);
						loaded = lazyLoad(repository.save(loaded));
					} catch (final InvalidRepositoryPathException | InvalidRepositoryFileDataException e1) {
						log.warn("Error while adding metadata file.", e1);
					}
				}
			} finally {
				if (tempFile.exists()) tempFile.delete();
			}
		} catch (final IOException e) {
			log.warn("Error while generating metadata file.", e);
		}

		{
			// Relax permissions on dataset files: allow USERS and ANONYMOUS to read the
			// files
			for (final RepositoryFile datasetFile : loaded.getRepositoryFiles()) {
				aclService.makePubliclyReadable(datasetFile, true);
			}
		}

		// Make dataset publicly readable
		aclService.makePubliclyReadable(loaded, true);

		final DatasetVersions datasetVersions = loaded.getVersions();
		final Dataset oldCurrentDataset = datasetVersions.getAllVersions().stream().filter(s -> Objects.equals(s.getCurrent(), Boolean.TRUE)).findFirst().orElse(null);
		if (oldCurrentDataset != null) {
			oldCurrentDataset.setCurrent(null);
			repository.save(oldCurrentDataset);
		}
		loaded.setCurrent(Boolean.TRUE);
		loaded.setCurrentVersion(null);
		datasetVersions.setCurrentVersion(loaded);
		datasetVersionsRepository.save(datasetVersions);

		return lazyLoad(repository.save(loaded));
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	@NotifyForReview
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset reviewDataset(final Dataset dataset) {
		final Dataset loaded = getUnpublishedDataset(dataset);

		if (loaded.getState() == PublishState.REVIEWING) {
			throw new InvalidApiUsageException("The dataset is already under approval");
		}

		for (final Descriptor descriptor : loaded.getDescriptors()) {
			if (descriptor.getState() == PublishState.DRAFT) {
				log.info("Submitting descriptor for review {}", descriptor);
				try {
					descriptorService.reviewDescriptor(descriptor);
				} catch (InvalidApiUsageException e) {
					throw e;
				}
			}
		}

		loaded.setState(PublishState.REVIEWING);

		return lazyLoad(repository.save(loaded));
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'administration')")
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset rejectDataset(final Dataset dataset) {
		Dataset loaded = getDataset(dataset);
		if (loaded == null) {
			throw new NotFoundElement("No dataset with specified uuid and version");
		}

		if (loaded.isPublished() && !securityUtils.hasRole(UserRole.ADMINISTRATOR)) {
			long oneDay = 24 * 60 * 60 * 1000;
			if (loaded.getLastModifiedDate() != null && loaded.getLastModifiedDate().toEpochMilli() <= (System.currentTimeMillis() - oneDay)) {
				throw new InvalidApiUsageException("Cannot be un-published. More than 24 hours have passed since the publication.");
			}
		}

		if (loaded.isPublished() && Objects.equals(loaded.getCurrent(), true)) {
			final DatasetVersions datasetVersions = loaded.getVersions();
			List<Dataset> notCurrentPublishedVersions = datasetVersions.getAllVersions().stream()
					.filter(d -> d.getCurrent() == null && d.isPublished()).collect(Collectors.toList());

			if (!notCurrentPublishedVersions.isEmpty()) {
				UUID youngestDatasetUUID = notCurrentPublishedVersions.stream()
						.max(Comparator.comparing(Dataset::getCreatedDate)).get().getUuid();

				loaded.setCurrent(null);
				repository.save(loaded);

				Dataset youngestDataset = repository.findByUuid(youngestDatasetUUID);
				youngestDataset.setCurrent(true);
				repository.save(youngestDataset);
				datasetVersions.setCurrentVersion(youngestDataset);
				loaded.setCurrentVersion(youngestDatasetUUID);
			} else {
				loaded.setCurrent(null);
				datasetVersions.setCurrentVersion(null);
			}
			datasetVersionsRepository.save(datasetVersions);
		} else if (loaded.isPublished() && Objects.isNull(loaded.getCurrent())) {
			throw new InvalidApiUsageException("Cannot be un-published. The dataset is not the latest version.");
		}

		loaded.setState(PublishState.DRAFT);

		{
			// Tighten permissions on dataset files
			for (final RepositoryFile datasetFile : loaded.getRepositoryFiles()) {
				aclService.makePubliclyReadable(datasetFile, false);
			}
		}

		// Make dataset publicly not-readable
		aclService.makePubliclyReadable(loaded, false);

		return lazyLoad(repository.save(loaded));
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public List<Object[]> lastPublished() {
		return repository.lastPublished();
	}

	/**
	 * {@inheritDoc}
	 */
	@Transactional
	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public DatasetCreator createDatasetCreator(Dataset dataset, final DatasetCreator input) throws NotFoundElement {
		dataset = getUnpublishedDataset(dataset);
		input.setDataset(dataset);
		return datasetCreatorRepository.save(input);
	}

	/**
	 * {@inheritDoc}
	 */
	@Transactional
	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public DatasetCreator removeDatasetCreator(Dataset dataset, final DatasetCreator input) throws NotFoundElement {
		dataset = getUnpublishedDataset(dataset);

		final DatasetCreator datasetCreator = loadDatasetCreator(input);
		if (!datasetCreator.getDataset().getUuid().equals(dataset.getUuid())) {
			throw new InvalidApiUsageException("Creator does not belong to dataset");
		}
		datasetCreatorRepository.delete(datasetCreator);

		return datasetCreator;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public Page<DatasetCreator> listDatasetCreators(final UUID datasetUuid, final Pageable page) {
		return datasetCreatorRepository.listByUUidOfDataset(page, datasetUuid);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public DatasetCreator loadDatasetCreator(final DatasetCreator input) throws NotFoundElement {
		log.info("Load DatasetCreator {}", input);
		final DatasetCreator datasetCreator = datasetCreatorRepository.findByUuid(input.getUuid());

		if (datasetCreator == null) {
			log.error("DatasetCreator {} not found", input);
			throw new NotFoundElement("DatasetCreator by " + input.getUuid().toString() + " no found");
		}
		if (!datasetCreator.getVersion().equals(input.getVersion())) {
			log.error("Don't match the version");
			throw new ConcurrencyFailureException("Object version changed to " + datasetCreator.getVersion() + ", you provided " + input.getVersion());
		}
		return datasetCreator;
	}

	@Override
	public DatasetCreator loadDatasetCreator(final UUID datasetCreatorUuid) throws NotFoundElement {
		log.info("Load DatasetCreator {}", datasetCreatorUuid);
		final DatasetCreator datasetCreator = datasetCreatorRepository.findByUuid(datasetCreatorUuid);
		if (datasetCreator == null) {
			log.error("DatasetCreator {} not found", datasetCreatorUuid);
			throw new NotFoundElement("DatasetCreator by " + datasetCreatorUuid.toString() + " no found");
		}
		return datasetCreator;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public List<DatasetCreator> loadDatasetCreators(Dataset dataset) throws NotFoundElement {
		dataset = getDataset(dataset);
		return dataset.getCreators();
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public DatasetCreator updateDatasetCreator(Dataset dataset, final DatasetCreator input) throws NotFoundElement {
		dataset = getUnpublishedDataset(dataset);

		final DatasetCreator datasetCreator = loadDatasetCreator(input);
		if (!datasetCreator.getDataset().getUuid().equals(dataset.getUuid())) {
			throw new InvalidApiUsageException("Creator does not belong to dataset");
		}
		copyCreator(datasetCreator, input);
		return datasetCreatorRepository.save(datasetCreator);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public List<DatasetCreator> autocompleteCreators(final String text) {
		final HashSet<Long> ids = new HashSet<>(securityUtils.listObjectIdentityIdsForCurrentUser(Dataset.class, BasePermission.WRITE));
		final Predicate predicate = datasetCreator.dataset().id.in(ids).and(datasetCreator.fullName.startsWithIgnoreCase(text).or(datasetCreator.institutionalAffiliation
			.startsWithIgnoreCase(text)));
		return datasetCreatorRepository.findAll(predicate, PageRequest.of(0, 20, Sort.by("fullName"))).getContent();
	}

	/**
	 * Copy creator values.
	 *
	 * @param target the target
	 * @param source the source
	 */
	private void copyCreator(final DatasetCreator target, final DatasetCreator source) {
		target.setFullName(source.getFullName());
		target.setEmail(source.getEmail());
		target.setPhoneNumber(source.getPhoneNumber());
		target.setFax(source.getFax());
		target.setInstituteAddress(source.getInstituteAddress());
		target.setInstitutionalAffiliation(source.getInstitutionalAffiliation());
		target.setRole(source.getRole());
	}

	/**
	 * Copy location values.
	 *
	 * @param target the target
	 * @param source the source
	 */
	private void copyLocation(final DatasetLocation target, final DatasetLocation source) {
		target.setUserCountry(source.getUserCountry());
		target.setMapCountry(source.getMapCountry());
		target.setStateProvince(source.getStateProvince());
		target.setVerbatimLocality(source.getVerbatimLocality());
		target.setDecimalLatitude(source.getDecimalLatitude());
		target.setDecimalLongitude(source.getDecimalLongitude());
		target.setCountryCode(source.getCountryCode());
		target.setStartDate(source.getStartDate());
		target.setEndDate(source.getEndDate());
		target.setDescription(source.getDescription());
	}

	/**
	 * Copy dataset accessionRef values.
	 *
	 * @param target the target
	 * @param source the source
	 */
	private void copyAccessionRef(final DatasetAccessionRef target, final DatasetAccessionRef source) {
		target.setDoi(source.getDoi());
		target.setInstCode(source.getInstCode());
		target.setAcceNumb(source.getAcceNumb());
		target.setGenus(source.getGenus());
		target.setSpecies(source.getSpecies());
		target.setAccession(source.getAccession());
	}

	/**
	 * Copy values.
	 *
	 * @param target the target
	 * @param source the source
	 */
	private void copyValues(final Dataset target, final Dataset source) {
		target.setTitle(source.getTitle());
		target.setState(source.getState());
		target.setDescription(source.getDescription());
		target.setFormat(source.getFormat());
		target.setOriginalLanguageTag(source.getOriginalLanguageTag());
		target.setSubject(source.getSubject());
		target.setRights(source.getRights());
		target.setSource(source.getSource());
		target.setOwner(source.getOwner());
		target.setVersionTag(source.getVersionTag());
		target.setCreated(source.getCreated());
		target.setStartDate(source.getStartDate());
		target.setEndDate(source.getEndDate());

		if (source.getCrops() != null) {
			if (target.getCrops() == null) {
				target.setCrops(new HashSet<>());
			}
			target.getCrops().clear();
			target.getCrops().addAll(source.getCrops());
		}
	}

	/**
	 * Copy descriptors.
	 *
	 * @param target the target
	 * @param descriptors the descriptors
	 */
	private void copyDescriptors(final Dataset target, final List<Descriptor> descriptors) {
		if (descriptors == null || descriptors.size() == 0) {
			return;
		}

		target.getDescriptors().clear();
		target.getDescriptors().addAll(descriptors.stream().distinct().collect(Collectors.toList()));
	}

	@Override
	@Transactional(readOnly = false)
	@PreAuthorize("hasRole('ADMINISTRATOR')")
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public void rematchDatasetAccessions() {
		repository.findAll().forEach(dataset -> {
			rematchDatasetAccessions(dataset);
		});
	}

	@Override
	@Transactional(readOnly = false)
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public Dataset rematchDatasetAccessions(Dataset dataset) {
		dataset = repository.findByUuid(dataset.getUuid());
		if (dataset == null) {
			return dataset;
		}
		List<DatasetAccessionRef> accessionRefs = dataset.getAccessionRefs();
		dataset.setAccessionCount(accessionRefs.size());
		dataset = repository.save(dataset);

		batchRematchAccessionRefs(accessionRefs);

		log.info("Done scheduling of relinking {} accession refs.", accessionRefs.size());
		return lazyLoad(dataset);
	}

	/**
	 * Schedule re-matching of AccessionRefs in batches
	 * 
	 * @param accessionRefs
	 */
	@Override
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public void batchRematchAccessionRefs(List<DatasetAccessionRef> accessionRefs) {
		Lists.partition(accessionRefs, 10000).parallelStream().forEach((batch) -> {
			taskExecutor.execute(() -> {
				try {
					log.info("Rematching {} dataset refs", batch.size());
					// Thread.sleep(100);
					accessionRefMatcher.rematchAccessionRefs(batch, accessionRefRepository);
				} catch (Throwable e) {
					log.info("Rematch failed with {}", e.getMessage(), e);
				}
			});
		});
	}

	@Override
	@Transactional(readOnly = false, propagation = Propagation.REQUIRED, isolation = Isolation.READ_UNCOMMITTED)
	@CacheEvict(value = "accessionAmphibianDatasets", allEntries = true)
	public int clearAccessionRefs(Collection<Accession> accessions) {
		if (accessions == null || accessions.isEmpty()) {
			return 0;
		}

		Iterable<DatasetAccessionRef> referencedRefs = accessionRefRepository.findAll(QDatasetAccessionRef.datasetAccessionRef.accession().in(accessions));
		AtomicInteger counter = new AtomicInteger(0);
		referencedRefs.forEach((ref) -> {
			ref.setAccession(null);
			counter.incrementAndGet();
		});
		accessionRefRepository.saveAll(referencedRefs);

		return counter.get();
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public DatasetLocation createLocation(Dataset dataset, final DatasetLocation input) throws NotFoundElement {
		dataset = getUnpublishedDataset(dataset);

		log.info("Create DatasetLocation {} for dataset {}", input, dataset.getUuid());
		input.setDataset(dataset);
		DatasetLocation savedLocation = locationRepository.save(input);

		dataset.getLocations().add(savedLocation);
		dataset.setLastModifiedDate(Instant.now());
		repository.save(dataset);

		return savedLocation;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public DatasetLocation removeLocation(Dataset dataset, final DatasetLocation input) throws NotFoundElement {
		dataset = getUnpublishedDataset(dataset);

		log.info("Remove DatasetLocation {} of dataset {}", input, dataset.getUuid());
		final DatasetLocation datasetLocation = loadLocation(input);
		if (!datasetLocation.getDataset().getUuid().equals(dataset.getUuid())) {
			throw new InvalidApiUsageException("Location does not belong to dataset");
		}
		locationRepository.delete(datasetLocation);

		/// Force update of Dataset#startDate, Dataset#endDate
		dataset.getLocations().remove(datasetLocation);
		dataset.setLastModifiedDate(Instant.now());
		repository.save(dataset);

		return datasetLocation;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public List<DatasetLocation> listLocation(Dataset dataset) throws NotFoundElement {
		log.info("Load list DatasetLocation for dataset {}", dataset.getUuid());
		dataset = getDataset(dataset);
		dataset.getLocations().size();
		return dataset.getLocations();
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public Page<DatasetLocation> listLocation(final UUID datasetUuid, final Pageable page) {
		log.info("Load list DatasetLocation for dataset {}", datasetUuid);
		return locationRepository.listByUUidOfDataset(page, datasetUuid);
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public DatasetLocation loadLocation(final DatasetLocation input) throws NotFoundElement {
		log.info("Load DatasetLocation {}", input);

		final DatasetLocation datasetLocation = locationRepository.findByUuid(input.getUuid());

		if (datasetLocation == null) {
			log.error("DatasetLocation by UUID {} not found", input);
			throw new NotFoundElement("DatasetLocation " + input.getUuid().toString() + " no found");
		}
		if (!datasetLocation.getVersion().equals(input.getVersion())) {
			log.error("Don't match the version");
			throw new ConcurrencyFailureException("Object version changed to " + datasetLocation.getVersion() + ", you provided " + input.getVersion());
		}
		return datasetLocation;
	}

	/**
	 * {@inheritDoc}
	 */
	@Override
	public DatasetLocation loadLocation(final UUID locationUuid) throws NotFoundElement {
		log.info("Load list DatasetLocation by uuid {}", locationUuid);

		final DatasetLocation datasetLocation = locationRepository.findByUuid(locationUuid);

		if (datasetLocation == null) {
			log.error("DatasetLocation by UUID {} not found", locationUuid);
			throw new NotFoundElement("DatasetCreator by " + locationUuid.toString() + " no found");
		}
		return datasetLocation;
	}

	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public DatasetLocation updateLocation(Dataset dataset, final DatasetLocation input) throws NotFoundElement {
		dataset = getUnpublishedDataset(dataset);

		final DatasetLocation datasetLocation = loadLocation(input);
		if (!datasetLocation.getDataset().getUuid().equals(dataset.getUuid())) {
			throw new InvalidApiUsageException("Location does not belong to dataset");
		}
		copyValue(datasetLocation, input);

		DatasetLocation saved = locationRepository.save(datasetLocation);
		dataset.getLocations().remove(input);
		dataset.getLocations().add(saved);
		dataset.setStartDate(saved.getStartDate());
		dataset.setEndDate(saved.getEndDate());
		update(dataset);

		return saved;
	}

	/**
	 * Copy value.
	 *
	 * @param target the target
	 * @param source the source
	 */
	protected void copyValue(final DatasetLocation target, final DatasetLocation source) {
		target.setDescription(source.getDescription());

		target.setUserCountry(source.getUserCountry());
		target.setMapCountry(source.getMapCountry());
		target.setCountryCode(source.getCountryCode());

		target.setStateProvince(source.getStateProvince());
		target.setVerbatimLocality(source.getVerbatimLocality());

		target.setDecimalLatitude(source.getDecimalLatitude());
		target.setDecimalLongitude(source.getDecimalLongitude());

		target.setStartDate(source.getStartDate());
		target.setEndDate(source.getEndDate());
	}

	@Override
	@Transactional(propagation = Propagation.MANDATORY) // Need to be part of an existing transaction!
	@PreAuthorize("hasRole('ADMINISTRATOR')")
	public long changeInstitute(FaoInstitute currentInstitute, FaoInstitute newInstitute) {
		// Note: Dataset links to a Partner, not FaoInstitute!
		log.warn("Migrating datasets from {} to {}", currentInstitute.getCode(), newInstitute.getCode());

		// Update accession references
		var qAccessionRef = QDatasetAccessionRef.datasetAccessionRef;
		return jpaQueryFactory.update(qAccessionRef)
			// Update instCode
			.set(qAccessionRef.instCode, newInstitute.getCode())
			// WHERE
			.where(qAccessionRef.instCode.eq(currentInstitute.getCode()))
			// Execute
			.execute();
	}

	@Override
	@PreAuthorize("#dataset==null || #dataset.published || hasRole('ADMINISTRATOR') || hasPermission(#dataset, 'read')")
	public List<Descriptor> getDatasetDescriptors(Dataset dataset) {
		var datasetDescriptors = repository.findByUuid(dataset.getUuid()).getDescriptors();
		datasetDescriptors.forEach(Descriptor::lazyLoad);
		return datasetDescriptors;
	}

	@Override
	@Transactional
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#dataset, 'write')")
	public List<Descriptor> synchronizeDescriptors(Dataset dataset) {
		List<Descriptor> datasetDescriptors = new ArrayList<>(repository.findByUuid(dataset.getUuid()).getDescriptors());
		var amphibianDataset = amphibianService.getAmphibianDataset(dataset);
		var amphibianDescriptors = amphibianDataset.getColumns().keySet();
		
		// Remove descriptors that are not in Amphibian
		datasetDescriptors.removeIf(descriptor -> !amphibianDescriptors.contains(String.valueOf(descriptor.getUuid())));
		
		// Get and add missing amphibian descriptors
		var descriptorUuids = datasetDescriptors.stream().map(Descriptor::getUuid).collect(Collectors.toSet());
		var missingDescriptorUuids = amphibianDescriptors.stream()
			.map(UUID::fromString)
			.filter(uuid -> !descriptorUuids.contains(uuid))
			.collect(Collectors.toSet());
		descriptorRepository.findAll(QDescriptor.descriptor.uuid.in(missingDescriptorUuids)).forEach(datasetDescriptors::add);

		dataset.setDescriptors(datasetDescriptors);
		var updated = repository.save(dataset);
		
		return updated.getDescriptors();
	}

	@Override
	@Cacheable(value = "accessionAmphibianDatasets", keyGenerator = "shortFilterKeyGenerator")
	public Set<UUID> findAccessionsAmphibianDatasets(AccessionFilter accessionFilter) {
		QDataset qDataset = QDataset.dataset;
		var query = jpaQueryFactory.from(qDataset).select(qDataset.uuid);
		var predicate = qDataset.state.in(Set.of(PublishState.PUBLISHED));
		predicate = predicate.and(qDataset.current.eq(true));
		if (! accessionFilter.isEmpty()) {
			if (accessionFilter.isFulltextQuery()) {
				throw new InvalidApiUsageException("Full-text search not supported");

//				log.warn("Using ES to find accessions");
//				var accessionIds = new LinkedList<Long>();
//				elasticsearchService.processById(Accession.class, accessionFilter, accessionIds::addAll, null);
//				var qDar = QDatasetAccessionRef.datasetAccessionRef;
//				var refQuery = jpaQueryFactory.from(qDar).select(qDar.list().id).distinct().where(qDar.accession().id.in(accessionIds));
//
//				predicate = predicate.and(qDataset.id.in(refQuery.fetch()));

			} else {
				var qA = QAccession.accession;
				var subQuery = JPAExpressions.selectFrom(qA);
				accessionFilter.buildJpaQuery(subQuery, qA);
				var qDar = QDatasetAccessionRef.datasetAccessionRef;
				var refQuery = jpaQueryFactory.from(qDar).select(qDar.list().id).distinct().where(qDar.accession().in(subQuery));
	
				predicate = predicate.and(qDataset.id.in(refQuery.fetch()));

			}
		} else {
			throw new InvalidApiUsageException("Accession filter must not be empty");
		}
		query.where(predicate);

		try {
			List<UUID> datasetUuids = LoggerHelper.withSqlLogging(() -> query.fetch());
			var amphibianDatasets = amphibianService.getAmphibianDatasetsList(datasetUuids);
			return Collections.unmodifiableSet(amphibianDatasets.stream().map(dt -> UUID.fromString(dt.getKey())).collect(Collectors.toSet()));
		} catch (Exception e) {
			throw new InvalidApiUsageException("Could not query for traits", e);
		}
	}

	private Set<DatasetAccessionRef> getDistinctAccessionRefs(Collection<DatasetAccessionRef> accessionRefs) {
		var distinctRefs = new TreeSet<>(distinctAcceRefsComparator);
		distinctRefs.addAll(accessionRefs);
		return distinctRefs;
	}

	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') || #dataset.isPublished() || hasPermission(#dataset, 'read')")
	public List<DescriptorTranslationService.TranslatedDescriptor> loadTranslatedDescriptors(Dataset dataset) {
		var reloaded = repository.findById(dataset.getId()).orElseThrow();
		return descriptorTranslationService.getTranslated(reloaded.getDescriptors());
	}

	@Override
	@PreAuthorize("hasRole('ADMINISTRATOR') or hasPermission(#original, 'write')")
	public DatasetLang machineTranslate(Dataset original, String targetLanguage) throws TranslatorService.TranslatorException {
		if (Objects.equals(original.getOriginalLanguageTag(), targetLanguage)) {
			throw new InvalidApiUsageException("Source and target language are the same");
}

		var mt = new DatasetLang();
		mt.setMachineTranslated(true);
		mt.setLanguageTag(targetLanguage);
		mt.setEntity(original);

		if (translatorService == null) return mt;

		var builder = TranslatorService.TranslationStructuredRequest.builder()
			.targetLang(targetLanguage);

		if (! Objects.equals(Locale.ENGLISH.getLanguage(), targetLanguage) && ! Objects.equals(Locale.ENGLISH.getLanguage(), original.getOriginalLanguageTag())) {
			// Translations to other languages use the English version (either original or translated)
			var enTranslation = translationSupport.getLang(original, Locale.ENGLISH.getLanguage());
			if (enTranslation == null) {
				throw new InvalidApiUsageException("English text is not available.");
			}

			builder
				.sourceLang(enTranslation.getLanguageTag())
				.context(buildTranslationContext(Dataset.class, "title", enTranslation.getTitle(), Locale.ENGLISH))
				.texts(Map.of(
					"title", new FormattedText(TextFormat.markdown, enTranslation.getTitle()),
					"description", new FormattedText(TextFormat.markdown, enTranslation.getDescription())
				));

		} else {
			// Translations to English use the original texts

			var originLocale = Locale.forLanguageTag(original.getOriginalLanguageTag());
			builder
				.sourceLang(original.getOriginalLanguageTag())
				.context(buildTranslationContext(Dataset.class, "title", original.getTitle(), originLocale))
				.texts(Map.of(
					"title", new TranslatorService.FormattedText(TranslatorService.TextFormat.markdown, original.getTitle()),
					"description", new TranslatorService.FormattedText(TranslatorService.TextFormat.markdown, original.getDescription())
				));
		}

		var translations = translatorService.translate(builder.build());

		if (StringUtils.isNotBlank(original.getTitle())) {
			mt.setTitle(translations.getTexts().get("title"));
		}
		if (StringUtils.isNotBlank(original.getDescription())) {
			mt.setDescription(translations.getTexts().get("description"));
		}
		return mt;
	}
}