<?php
/**
 * Uses the fgetcsv() function to process CSV input.
 * The input is expected to be UTF8.
 * 
 * @see http://rfc.net/rfc4180.html
 * @package cms
 * @subpackage bulkloading
 * @author Ingo Schommer, Silverstripe Ltd. (<ingo>@silverstripe.com>)
 * 
 * @todo Support for deleting existing records not matched in the import (through relation checks)
 */
class CsvBulkLoader extends BulkLoader {
	
	/**
	 * Delimiter character (Default: comma).
	 * Passed to fgetcsv() for every row that is read.
	 *
	 * @var string
	 */
	public $delimiter = ',';
	
	/**
	 * Enclosure character (Default: doublequote).
	 * Passed to fgetcsv() for every row that is read.
	 *
	 * @var string
	 */
	public $enclosure = '"';
	
	/**
	 * Identifies if the loaded file has a header row.
	 * If a {@link self::$columnMap} is passed, we assume
	 * the file has no headerrow, unless explicitly noted.
	 *
	 * @var boolean
	 */
	public $hasHeaderRow = false;
	
	/**
	 * Reads the CSV file row by row and hands every data row
	 * to {@link processRecord()}.
	 *
	 * The column map used for the import is determined as follows:
	 * - header row and {@link self::$columnMap} present: the header names
	 *   are looked up in the map, names without a mapping are mapped to null
	 * - only {@link self::$columnMap} present: the map is used as-is and
	 *   the first line of the file is treated as data
	 * - no {@link self::$columnMap}: the first line is used as header,
	 *   each column maps to a field of the same name
	 *
	 * @param string $filepath Path of the CSV file to read
	 * @param boolean $preview Passed through to {@link processRecord()}
	 * @return BulkLoader_Result|false False if the file could not be opened
	 */
	protected function processAll($filepath, $preview = false) {
		ini_set('auto_detect_line_endings',1);
		
		$file = fopen($filepath, 'r');
		if(!$file) return false;
		
		$results = new BulkLoader_Result();

		if($this->hasHeaderRow && $this->columnMap) {
			$columnRow = fgetcsv($file, 0, $this->delimiter, $this->enclosure);
			if(!is_array($columnRow)) {
				// empty file: no header and therefore nothing to import
				fclose($file);
				return $results;
			}
			
			$columnMap = array();
			foreach($columnRow as $origColumnName) {
				$origColumnName = trim($origColumnName);
				$columnMap[$origColumnName] = isset($this->columnMap[$origColumnName])
					? $this->columnMap[$origColumnName]
					: null;
			}
		} elseif($this->columnMap) {
			$columnMap = $this->columnMap;
		} else {
			// assuming that first row is column naming if no columnmap is passed
			$columnRow = fgetcsv($file, 0, $this->delimiter, $this->enclosure);
			if(!is_array($columnRow)) {
				// empty file: no header and therefore nothing to import
				fclose($file);
				return $results;
			}
			
			$columnMap = array_combine($columnRow, $columnRow);
		}

		$rowIndex = 0;
		while (($row = fgetcsv($file, 0, $this->delimiter, $this->enclosure)) !== FALSE) {
			$rowIndex++;
			
			// fgetcsv() reports a blank line as an array with a single null field,
			// importing it would create an empty record
			if($row === array(null)) continue;
			
			// key the positional row values by their original column name
			$indexedRow = array();
			$position = 0;
			foreach($columnMap as $origColumnName => $fieldName) {
				// in case the row has less fields than the columnmap,
				// ignore the "leftover" mappings (reported once per row)
				if(!isset($row[$position])) {
					user_error("CsvBulkLoader::processAll(): Columns in row {$rowIndex} don't match the \$columnMap", E_USER_NOTICE);
					break;
				}
	
				$indexedRow[$origColumnName] = $row[$position];
				$position++;
			}

			$this->processRecord($indexedRow, $columnMap, $results, $preview);
		}
		
		fclose($file);
		
		return $results;
	}
	
	/**
	 * Imports a single row: finds or creates the target object,
	 * resolves its relations, sets the remaining values and
	 * registers the object as created or updated in $results.
	 *
	 * Columns whose mapped field name is null are ignored.
	 * No object is written while $preview is set.
	 *
	 * @todo Better messages for relation checks and duplicate detection
	 *
	 * @param array $record Row values, keyed by original column name
	 * @param array $columnMap Original column name => field name
	 * @param BulkLoader_Result $results
	 * @param boolean $preview
	 */
	protected function processRecord($record, $columnMap, &$results, $preview = false) {
		$class = $this->objectClass;
		
		// find existing object, or create new one
		$existingObj = $this->findExistingObject($record, $columnMap);
		$obj = ($existingObj) ? $existingObj : new $class(); 
		
		// first run: find/create any relations and store them on the object
		// we can't combine runs, as other columns might rely on the relation being present
		foreach($record as $origColumnName => $val) {
			$fieldName = isset($columnMap[$origColumnName]) ? $columnMap[$origColumnName] : null;
			
			// column without a mapping, nothing to import
			if($fieldName === null) continue;
			
			// don't bother querying of value is not set
			if($this->isNullValue($val)) continue;
			
			// checking for existing relations
			if(isset($this->relationCallbacks[$fieldName])) {
				// trigger custom search method for finding a relation based on the given value
				// and write it back to the relation (or create a new object)
				$relationName = $this->relationCallbacks[$fieldName]['relationname'];
				$relationObj = $obj->{$this->relationCallbacks[$fieldName]['callback']}($val, $record);
				if(!$relationObj || !$relationObj->exists()) {
					$relationClass = $obj->has_one($relationName);
					$relationObj = new $relationClass();
					if(!$preview) $relationObj->write();
				}
				$obj->setComponent($relationName, $relationObj);
				$obj->{"{$relationName}ID"} = $relationObj->ID;
				if(!$preview) $obj->write();
			} elseif(strpos($fieldName, '.') !== false) {
				// we have a relation column with dot notation
				// (explode() instead of split(), which was removed in PHP 7)
				list($relationName,$columnName) = explode('.', $fieldName);
				$relationObj = $obj->getComponent($relationName); // always gives us an component (either empty or existing)
				$obj->setComponent($relationName, $relationObj);
				if(!$preview) $relationObj->write();
				$obj->{"{$relationName}ID"} = $relationObj->ID;
				if(!$preview) $obj->write();
			}
			
			$obj->flushCache(); // avoid relation caching confusion
		}
		if(!$preview) $obj->write();

		// second run: save data
		foreach($record as $origColumnName => $val) {
			$fieldName = isset($columnMap[$origColumnName]) ? $columnMap[$origColumnName] : null;

			// column without a mapping, nothing to import
			if($fieldName === null) continue;

			if($this->isNullValue($val, $fieldName)) continue;

			if($obj->hasMethod("import{$fieldName}")) {
				// custom importer on the object takes precedence
				$obj->{"import{$fieldName}"}($val, $record);
			} elseif(strpos($fieldName, '.') !== false) {
				// we have a relation column
				list($relationName,$columnName) = explode('.', $fieldName);
				$relationObj = $obj->getComponent($relationName);
				$relationObj->{$columnName} = $val;
				if(!$preview) $relationObj->write();
				$obj->flushCache(); // avoid relation caching confusion
			} else {
				// plain old value setter
				$obj->{$fieldName} = $val;
			}
		}
		
		// write record
		if(!$preview) $obj->write();
		
		// @todo better message support
		$message = '';
		
		// save to results
		if($existingObj) {
			$results->addUpdated($obj, $message);
		} else {
			$results->addCreated($obj, $message);
		}
		
		// memory usage
		unset($existingObj);
		unset($obj);
	}
	
	/**
	 * Find an existing objects based on one or more uniqueness
	 * columns specified via {@link self::$duplicateChecks}.
	 *
	 * Each check is either a string (name of the database field that is
	 * compared with the value of the CSV column) or an array with a
	 * 'callback' key (method called on the singleton of the object class
	 * with the column value and the whole record).
	 * The first check that yields a record wins.
	 *
	 * @param array $record CSV data column
	 * @param array $columnMap
	 * @return mixed The record returned by the matching check,
	 *  or false if no check matched
	 */
	public function findExistingObject($record, $columnMap) {
		// checking for existing records (only if not already found)
		foreach($this->duplicateChecks as $fieldName => $duplicateCheck) {
			if(is_string($duplicateCheck)) {
				// the identifier column is missing in this row:
				// give up, later checks are not evaluated
				if(!isset($record[$fieldName])) {
					return false;
				}
				
				// both parts are escaped, the value comes straight from the imported file
				$SQL_fieldName = Convert::raw2sql($duplicateCheck); 
				$SQL_fieldValue = Convert::raw2sql($record[$fieldName]);
				$existingRecord = DataObject::get_one($this->objectClass, "`$SQL_fieldName` = '{$SQL_fieldValue}'");
				if($existingRecord) return $existingRecord;
			} elseif(is_array($duplicateCheck) && isset($duplicateCheck['callback'])) {
				// the callback receives null if the row doesn't contain the column
				$fieldValue = isset($record[$fieldName]) ? $record[$fieldName] : null;
				$existingRecord = singleton($this->objectClass)->{$duplicateCheck['callback']}($fieldValue, $record);
				if($existingRecord) return $existingRecord;
			} else {
				user_error('CsvBulkLoader:processRecord: Wrong format for $duplicateChecks', E_USER_ERROR);
			}
		}
		
		return false;
	}
	
	
	/**
	 * Determine whether any loaded files should be parsed
	 * with a header-row (otherwise we rely on {@link self::$columnMap}).
	 *
	 * NOTE(review): this returns true whenever {@link self::$columnMap} is set,
	 * while processAll() reads a header row if {@link self::$hasHeaderRow}
	 * is set or if the column map is empty - confirm which one callers expect.
	 *
	 * @return boolean
	 */
	public function hasHeaderRow() {
		return ($this->hasHeaderRow || isset($this->columnMap));
	}
	
}
?>