https://github.com/N-BodyShop/changa
Tip revision: e56b7faf8786109a8d865fc8b02966906f49cd28 authored by Cambridge on 30 April 2018, 06:07:45 UTC
All the changes for GPU local tree walk
All the changes for GPU local tree walk
Tip revision: e56b7fa
Sph.cpp
/*
* Routines to implement SPH.
* Main author: James Wadsley, as first implemented in GASOLINE.
* See Wadsley, J.~W., Stadel, J., Quinn, T.\ 2004.\ Gasoline: a flexible,
* parallel implementation of TreeSPH.\ New Astronomy 9, 137-158.
*/
#include "ParallelGravity.h"
#include "DataManager.h"
#include "smooth.h"
#include "Sph.h"
#include "SphUtils.h"
#include "physconst.h"
#ifndef MAXPATHLEN
#define MAXPATHLEN PATH_MAX
#endif
#include <float.h>
///
/// @brief initialize SPH quantities
///
/// Initial calculation of densities and internal energies, and cooling rates.
///
void
Main::initSph()
{
if(param.bDoGas) {
ckout << "Calculating densities/divv ...";
// The following smooths all GAS, and also marks neighbors of
// actives, and those who have actives as neighbors
// Starting is true
DenDvDxSmoothParams pDen(TYPE_GAS, 0, param.csm, dTime, 0,
param.bConstantDiffusion, 1, bHaveAlpha,
param.dConstAlphaMax);
double startTime = CkWallTimer();
double dfBall2OverSoft2 = 4.0*param.dhMinOverSoft*param.dhMinOverSoft;
treeProxy.startSmooth(&pDen, 1, param.nSmooth, dfBall2OverSoft2,
CkCallbackResumeThread());
ckout << " took " << (CkWallTimer() - startTime) << " seconds."
<< endl;
if(verbosity > 1 && !param.bConcurrentSph)
memoryStatsCache();
double dTuFac = param.dGasConst/(param.dConstGamma-1)
/param.dMeanMolWeight;
double z = 1.0/csmTime2Exp(param.csm, dTime) - 1.0;
if(param.bGasCooling) {
// Update cooling on the datamanager
dMProxy.CoolingSetTime(z, dTime, CkCallbackResumeThread());
if(!bIsRestarting) // Energy is already OK from checkpoint.
treeProxy.InitEnergy(dTuFac, z, dTime, CkCallbackResumeThread());
}
if(verbosity) CkPrintf("Initializing SPH forces\n");
nActiveSPH = nTotalSPH;
doSph(0, 0);
double duDelta[MAXRUNG+1];
double dStartTime[MAXRUNG+1];
for(int iRung = 0; iRung <= MAXRUNG; iRung++) {
duDelta[iRung] = 0.5e-7*param.dDelta;
dStartTime[iRung] = dTime;
}
treeProxy.updateuDot(0, duDelta, dStartTime, param.bGasCooling, 0, 1,
CkCallbackResumeThread());
}
}
// see below for definition.
bool arrayFileExists(const std::string filename, const int64_t count) ;
#include <sys/stat.h>
///
/// @brief Initialize cooling constants and integration data structures.
///
void Main::initCooling()
{
#ifndef COOLING_NONE
dMProxy.initCooling(param.dGmPerCcUnit, param.dComovingGmPerCcUnit,
param.dErgPerGmUnit, param.dSecUnit, param.dKpcUnit,
param.CoolParam, CkCallbackResumeThread());
/* Read in tables from files as necessary */
int cntTable = 0;
int nTableRows;
int nTableColumns;
char TableFileSuffix[20];
for (;;) {
CoolTableReadInfo(¶m.CoolParam, cntTable, &nTableColumns,
TableFileSuffix);
if (!nTableColumns) break;
cntTable++;
nTableRows = ReadASCII(TableFileSuffix, nTableColumns, NULL);
if (nTableRows) {
CkAssert(sizeof(double)*nTableRows*nTableColumns <= CL_NMAXBYTETABLE );
double *dTableData = (double *)malloc(sizeof(double)*nTableRows*nTableColumns);
CkAssert( dTableData != NULL );
nTableRows = ReadASCII(TableFileSuffix, nTableColumns, dTableData);
dMProxy.dmCoolTableRead(dTableData,nTableRows*nTableColumns,
CkCallbackResumeThread());
free(dTableData);
}
}
treeProxy.initCoolingData(CkCallbackResumeThread());
if(!bIsRestarting) { // meaning not restarting from a checkpoint.
struct stat s;
int err = stat(basefilename.c_str(), &s);
if(err != -1 && S_ISDIR(s.st_mode)) {
// The file is a directory; assume NChilada
int64_t nGas = 0;
nGas = ncGetCount(basefilename + "/gas/coolontime");
if(nGas == nTotalSPH) {
CkPrintf("Reading coolontime\n");
coolontimeOutputParams pCoolOnOut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pCoolOnOut, param.bParaRead,
CkCallbackResumeThread());
}
}
else {
if(arrayFileExists(basefilename + ".coolontime", nTotalParticles)) {
CkPrintf("Reading coolontime\n");
coolontimeOutputParams pCoolOnOut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pCoolOnOut, CkCallbackResumeThread());
}
}
}
#endif
}
/**
* Initialized Cooling Read-only data on the DataManager, which
* doesn't migrate.
*/
void
DataManager::initCooling(double dGmPerCcUnit, double dComovingGmPerCcUnit,
double dErgPerGmUnit, double dSecUnit, double dKpcUnit,
COOLPARAM inParam, const CkCallback& cb)
{
#ifndef COOLING_NONE
clInitConstants(Cool, dGmPerCcUnit, dComovingGmPerCcUnit, dErgPerGmUnit,
dSecUnit, dKpcUnit, inParam);
CoolInitRatesTable(Cool,inParam);
#endif
contribute(cb);
}
/**
* Per thread initialization
*/
void
TreePiece::initCoolingData(const CkCallback& cb)
{
#ifndef COOLING_NONE
bGasCooling = 1;
dm = (DataManager*)CkLocalNodeBranch(dataManagerID);
CoolData = CoolDerivsInit(dm->Cool);
#endif
contribute(cb);
}
void
DataManager::dmCoolTableRead(double *dTableData, int nData, const CkCallback& cb)
{
#ifndef COOLING_NONE
CoolTableRead(Cool, nData*sizeof(double), (void *) dTableData);
#endif
contribute(cb);
}
///
/// @brief function from PKDGRAV to read an ASCII table
///
/// @param extension Appended to outName to determine file name to
/// read.
/// @param nDataPerLine Number of columns in the table.
/// @param dDataOut pointer to array in which to store the table.
/// Note if dDataOut is NULL it just counts the number of valid input
/// lines.
///
int Main::ReadASCII(char *extension, int nDataPerLine, double *dDataOut)
{
FILE *fp;
int i,ret;
char achIn[160];
double *dData;
if (dDataOut == NULL)
dData = (double *)malloc(sizeof(double)*nDataPerLine);
else
dData = dDataOut;
CkAssert(nDataPerLine > 0 && nDataPerLine <= 10);
char achFile[MAXPATHLEN];
sprintf(achFile, "%s.%s", param.achOutName, extension);
fp = fopen(achFile,"r");
if (!fp) {
CkPrintf("WARNING: Could not open .%s input file:%s\n",
extension,achFile);
return 0;
}
i = 0;
while (1) {
if (!fgets(achIn,160,fp)) goto Done;
switch (nDataPerLine) {
case 1:
ret = sscanf(achIn,"%lf",dData);
break;
case 2:
ret = sscanf(achIn,"%lf %lf",dData,dData+1);
break;
case 3:
ret = sscanf(achIn,"%lf %lf %lf",dData,dData+1,dData+2);
break;
case 4:
ret = sscanf(achIn,"%lf %lf %lf %lf",dData,dData+1,dData+2,dData+3);
break;
case 5:
ret = sscanf(achIn,"%lf %lf %lf %lf %lf",dData,dData+1,dData+2,dData+3,dData+4);
break;
case 6:
ret = sscanf(achIn,"%lf %lf %lf %lf %lf %lf",dData,dData+1,dData+2,dData+3,dData+4,dData+5);
break;
case 7:
ret = sscanf(achIn,"%lf %lf %lf %lf %lf %lf %lf",
dData,dData+1,dData+2,dData+3,dData+4,dData+5,dData+6);
break;
case 8:
ret = sscanf(achIn,"%lf %lf %lf %lf %lf %lf %lf %lf",
dData,dData+1,dData+2,dData+3,dData+4,dData+5,dData+6,dData+7);
break;
case 9:
ret = sscanf(achIn,"%lf %lf %lf %lf %lf %lf %lf %lf %lf",
dData,dData+1,dData+2,dData+3,dData+4,dData+5,dData+6,dData+7,dData+8);
break;
case 10:
ret = sscanf(achIn,"%lf %lf %lf %lf %lf %lf %lf %lf %lf %lf",
dData,dData+1,dData+2,dData+3,dData+4,dData+5,dData+6,dData+7,dData+8,dData+9);
break;
default:
ret = EOF;
CkAssert(0);
}
if (ret != nDataPerLine) goto Done;
++i;
if (dDataOut != NULL) dData += nDataPerLine;
}
Done:
fclose(fp);
if (dDataOut != NULL && verbosity)
printf("Read %i lines from %s\n",i,achFile);
if (dDataOut == NULL) free(dData);
return i;
}
/*
* Update the cooling functions to the current time.
* This is on the DataManager to avoid duplication of effort.
*/
void
DataManager::CoolingSetTime(double z, // redshift
double dTime, // Time
const CkCallback& cb)
{
#ifndef COOLING_NONE
CoolSetTime( Cool, dTime, z );
#endif
contribute(cb);
}
/**
* @brief DataManager::SetStarCM saves the total mass and center of mass of the
* star(s) to the COOL struct Cool, making them available to the cool particles
* @param dCenterOfMass Array(length 4) which contains the star(s) center of
* mass as the first 3 entries and the total star mass as the final entry
* @param cb Callback
*/
void DataManager::SetStarCM(double dCenterOfMass[4], const CkCallback& cb) {
#ifndef COOLING_NONE
#ifdef COOLING_PLANET
CoolSetStarCM(Cool, dCenterOfMass);
#endif
#endif
contribute(cb);
}
/**
* @brief utility for checking array files
*/
bool
arrayFileExists(const std::string filename, const int64_t count)
{
FILE *fp = CmiFopen(filename.c_str(), "r");
if(fp != NULL) {
// Check if its a binary file
unsigned int iDum;
XDR xdrs;
xdrstdio_create(&xdrs, fp, XDR_DECODE);
xdr_u_int(&xdrs,&iDum);
xdr_destroy(&xdrs);
if(iDum == count) { // Assume a valid binary array file
fclose(fp);
return true;
}
fseek(fp, 0, SEEK_SET);
int64_t nIOrd;
fscanf(fp, "%ld", &nIOrd);
CkAssert(nIOrd == count); // Valid ASCII file.
fclose(fp);
return true;
}
return false;
}
/// @brief Set total metals based on Ox and Fe mass fractions
void
TreePiece::resetMetals(const CkCallback& cb)
{
for(unsigned int i = 1; i <= myNumParticles; ++i) {
GravityParticle *p = &myParticles[i];
// Use total metals to Fe and O based on Asplund et al 2009
if (p->isGas())
p->fMetals() = 1.06*p->fMFracIron() + 2.09*p->fMFracOxygen();
if (p->isStar())
p->fStarMetals() = 1.06*p->fStarMFracIron()
+ 2.09*p->fStarMFracOxygen();
}
contribute(cb);
}
#include <sys/stat.h>
/**
* @brief Read in array files for complete gas information.
*/
void
Main::restartGas()
{
if(verbosity)
CkPrintf("Restarting Gas Simulation with array files.\n");
struct stat s;
int err = stat(basefilename.c_str(), &s);
if(err != -1 && S_ISDIR(s.st_mode)) {
// The file is a directory; assume NChilada
int64_t nGas = 0;
int64_t nDark = 0;
int64_t nStar = 0;
if(nTotalSPH > 0)
nGas = ncGetCount(basefilename + "/gas/iord");
if(nTotalDark > 0)
nDark = ncGetCount(basefilename + "/dark/iord");
if(nTotalStar > 0)
nStar = ncGetCount(basefilename + "/star/iord");
if(nGas + nDark + nStar == nTotalParticles) {
IOrderOutputParams pIOrdOut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pIOrdOut, param.bParaRead,
CkCallbackResumeThread());
CkReductionMsg *msg;
treeProxy.getMaxIOrds(CkCallbackResumeThread((void*&)msg));
CmiInt8 *maxIOrds = (CmiInt8 *)msg->getData();
nMaxOrderGas = maxIOrds[0];
nMaxOrderDark = maxIOrds[1];
nMaxOrder = maxIOrds[2];
delete msg;
}
else
CkError("WARNING: no iorder file, or wrong format for restart\n");
if(nTotalStar > 0)
nStar = ncGetCount(basefilename + "/star/igasorder");
if(nStar == nTotalStar) {
IGasOrderOutputParams pIOrdOut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pIOrdOut, param.bParaRead,
CkCallbackResumeThread());
}
else
CkError("WARNING: no igasorder file, or wrong format for restart\n");
if(param.bFeedback) {
if(nTotalSPH > 0)
nGas = ncGetCount(basefilename + "/gas/ESNRate");
if(nTotalStar > 0)
nStar = ncGetCount(basefilename + "/star/ESNRate");
if(nGas + nStar == nTotalSPH + nTotalStar) {
ESNRateOutputParams pESNROut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pESNROut, param.bParaRead,
CkCallbackResumeThread());
}
else
CkError("WARNING: no ESNRate file, or wrong format for restart\n");
if(nTotalSPH > 0)
nGas = ncGetCount(basefilename + "/gas/OxMassFrac");
if(nTotalStar > 0)
nStar = ncGetCount(basefilename + "/star/OxMassFrac");
if(nGas + nStar == nTotalSPH + nTotalStar) {
OxOutputParams pOxOut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pOxOut, param.bParaRead,
CkCallbackResumeThread());
}
else
CkError("WARNING: no OxMassFrac file, or wrong format for restart\n");
if(nTotalSPH > 0)
nGas = ncGetCount(basefilename + "/gas/FeMassFrac");
if(nTotalStar > 0)
nStar = ncGetCount(basefilename + "/star/FeMassFrac");
if(nGas + nStar == nTotalSPH + nTotalStar) {
FeOutputParams pFeOut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pFeOut, param.bParaRead,
CkCallbackResumeThread());
}
else
CkError("WARNING: no FeMassFrac file, or wrong format for restart\n");
treeProxy.resetMetals(CkCallbackResumeThread());
if(nTotalStar > 0)
nStar = ncGetCount(basefilename + "/star/massform");
if(nStar == nTotalStar) {
MFormOutputParams pMFOut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pMFOut, param.bParaRead,
CkCallbackResumeThread());
}
else
CkError("WARNING: no massform file, or wrong format for restart\n");
}
#ifdef CULLENALPHA
if(nTotalSPH > 0) {
nGas = ncGetCount(basefilename + "/gas/alpha");
if(nGas == nTotalSPH) {
AlphaOutputParams pAlphaOut(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pAlphaOut, param.bParaRead,
CkCallbackResumeThread());
bHaveAlpha = 1;
}
else
CkError("WARNING: no alpha file, or wrong format for restart\n");
}
#endif
#ifndef COOLING_NONE
if(param.bGasCooling && nTotalSPH > 0) {
bool bFoundCoolArray = false;
// read ionization fractions
nGas = ncGetCount(basefilename + "/gas/" + COOL_ARRAY0_EXT);
if(nGas == nTotalSPH) {
Cool0OutputParams pCool0Out(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pCool0Out, param.bParaRead,
CkCallbackResumeThread());
bFoundCoolArray = true;
}
else
CkError("WARNING: no CoolArray0 file, or wrong format for restart\n");
nGas = ncGetCount(basefilename + "/gas/" + COOL_ARRAY1_EXT);
if(nGas == nTotalSPH) {
Cool1OutputParams pCool1Out(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pCool1Out, param.bParaRead,
CkCallbackResumeThread());
bFoundCoolArray = true;
}
else
CkError("WARNING: no CoolArray1 file, or wrong format for restart\n");
nGas = ncGetCount(basefilename + "/gas/" + COOL_ARRAY2_EXT);
if(nGas == nTotalSPH) {
Cool2OutputParams pCool2Out(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pCool2Out, param.bParaRead,
CkCallbackResumeThread());
bFoundCoolArray = true;
}
else
CkError("WARNING: no CoolArray2 file, or wrong format for restart\n");
nGas = ncGetCount(basefilename + "/gas/" + COOL_ARRAY3_EXT);
if(nGas == nTotalSPH) {
Cool3OutputParams pCool3Out(basefilename, 6, 0.0);
treeProxy.readFloatBinary(pCool3Out, param.bParaRead,
CkCallbackResumeThread());
bFoundCoolArray = true;
}
else
CkError("WARNING: no CoolArray3 file, or wrong format for restart\n");
double dTuFac = param.dGasConst/(param.dConstGamma-1)
/param.dMeanMolWeight;
if(bFoundCoolArray) {
// reset thermal energy with ionization fractions
treeProxy.RestartEnergy(dTuFac, CkCallbackResumeThread());
}
else {
double z = 1.0/csmTime2Exp(param.csm, dTime) - 1.0;
dMProxy.CoolingSetTime(z, dTime, CkCallbackResumeThread());
treeProxy.InitEnergy(dTuFac, z, dTime, CkCallbackResumeThread());
}
}
#endif
} else {
// Assume TIPSY arrays
// read iOrder
if(arrayFileExists(basefilename + ".iord", nTotalParticles)) {
CkReductionMsg *msg;
IOrderOutputParams pIOrdOut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pIOrdOut, CkCallbackResumeThread());
treeProxy.getMaxIOrds(CkCallbackResumeThread((void*&)msg));
CmiInt8 *maxIOrds = (CmiInt8 *)msg->getData();
nMaxOrderGas = maxIOrds[0];
nMaxOrderDark = maxIOrds[1];
nMaxOrder = maxIOrds[2];
delete msg;
}
else
CkError("WARNING: no iOrder file for restart\n");
// read iGasOrder
if(arrayFileExists(basefilename + ".igasorder", nTotalParticles)) {
IGasOrderOutputParams pIOrdOut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pIOrdOut, CkCallbackResumeThread());
}
else {
CkError("WARNING: no igasorder file for restart\n");
}
if(param.bFeedback) {
if(arrayFileExists(basefilename + ".ESNRate", nTotalParticles)) {
ESNRateOutputParams pESNROut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pESNROut, CkCallbackResumeThread());
}
if(arrayFileExists(basefilename + ".OxMassFrac", nTotalParticles)) {
OxOutputParams pOxOut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pOxOut, CkCallbackResumeThread());
}
if(arrayFileExists(basefilename + ".FeMassFrac", nTotalParticles)) {
FeOutputParams pFeOut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pFeOut, CkCallbackResumeThread());
}
treeProxy.resetMetals(CkCallbackResumeThread());
if(arrayFileExists(basefilename + ".massform", nTotalParticles)) {
MFormOutputParams pMFOut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pMFOut, CkCallbackResumeThread());
}
}
#ifdef CULLENALPHA
if(arrayFileExists(basefilename + ".alpha", nTotalParticles)) {
AlphaOutputParams pAlphaOut(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pAlphaOut, CkCallbackResumeThread());
bHaveAlpha = 1;
}
else
CkError("WARNING: no alpha file, or wrong format for restart\n");
#endif
#ifndef COOLING_NONE
if(param.bGasCooling) {
bool bFoundCoolArray = false;
// read ionization fractions
if(arrayFileExists(basefilename + "." + COOL_ARRAY0_EXT, nTotalParticles)) {
Cool0OutputParams pCool0Out(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pCool0Out, CkCallbackResumeThread());
bFoundCoolArray = true;
}
else {
CkError("WARNING: no CoolArray0 file for restart\n");
}
if(arrayFileExists(basefilename + "." + COOL_ARRAY1_EXT, nTotalParticles)) {
Cool1OutputParams pCool1Out(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pCool1Out, CkCallbackResumeThread());
bFoundCoolArray = true;
}
else {
CkError("WARNING: no CoolArray1 file for restart\n");
}
if(arrayFileExists(basefilename + "." + COOL_ARRAY2_EXT, nTotalParticles)) {
Cool2OutputParams pCool2Out(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pCool2Out, CkCallbackResumeThread());
bFoundCoolArray = true;
}
else {
CkError("WARNING: no CoolArray2 file for restart\n");
}
if(arrayFileExists(basefilename + "." + COOL_ARRAY3_EXT, nTotalParticles)) {
Cool3OutputParams pCool3Out(basefilename, 0, 0.0);
treeProxy.readTipsyArray(pCool3Out, CkCallbackResumeThread());
bFoundCoolArray = true;
}
else {
CkError("WARNING: no CoolArray3 file for restart\n");
}
double dTuFac = param.dGasConst/(param.dConstGamma-1)
/param.dMeanMolWeight;
if(bFoundCoolArray) {
// reset thermal energy with ionization fractions
treeProxy.RestartEnergy(dTuFac, CkCallbackResumeThread());
}
else {
double z = 1.0/csmTime2Exp(param.csm, dTime) - 1.0;
dMProxy.CoolingSetTime(z, dTime, CkCallbackResumeThread());
treeProxy.InitEnergy(dTuFac, z, dTime, CkCallbackResumeThread());
}
}
#endif
}
}
/*
* Initialize energy on restart
*/
void TreePiece::RestartEnergy(double dTuFac, // T to internal energy
const CkCallback& cb)
{
#ifndef COOLING_NONE
COOL *cl;
dm = (DataManager*)CkLocalNodeBranch(dataManagerID);
cl = dm->Cool;
#endif
for(unsigned int i = 1; i <= myNumParticles; ++i) {
GravityParticle *p = &myParticles[i];
if (p->isGas()) {
#ifndef COOLING_NONE
#ifndef COOLING_GRACKLE
double T;
T = p->u() / dTuFac;
PERBARYON Y;
CoolPARTICLEtoPERBARYON(cl, &Y, &p->CoolParticle());
p->u() = clThermalEnergy(Y.Total,T)*cl->diErgPerGmUnit;
#endif
#endif
p->uPred() = p->u();
}
}
contribute(cb);
}
/**
* @brief Perform the SPH force calculation.
* @param activeRung Timestep rung (and above) on which to perform
* SPH
* @param bNeedDensity Does the density calculation need to be done?
* Defaults to 1
*/
void
Main::doSph(int activeRung, int bNeedDensity)
{
if(bNeedDensity) {
double dfBall2OverSoft2 = 4.0*param.dhMinOverSoft*param.dhMinOverSoft;
if (param.bFastGas && nActiveSPH < nTotalSPH*param.dFracFastGas) {
ckout << "Calculating densities/divv on Actives ...";
// This also marks neighbors of actives
DenDvDxSmoothParams pDen(TYPE_GAS, activeRung, param.csm, dTime, 1,
param.bConstantDiffusion, 0, 0,
param.dConstAlphaMax);
double startTime = CkWallTimer();
treeProxy.startSmooth(&pDen, 1, param.nSmooth, dfBall2OverSoft2,
CkCallbackResumeThread());
ckout << " took " << (CkWallTimer() - startTime) << " seconds."
<< endl;
ckout << "Marking Neighbors ...";
// This marks particles with actives as neighbors
MarkSmoothParams pMark(TYPE_GAS, activeRung);
startTime = CkWallTimer();
treeProxy.startMarkSmooth(&pMark, CkCallbackResumeThread());
ckout << " took " << (CkWallTimer() - startTime) << " seconds."
<< endl;
ckout << "Density of Neighbors ...";
// This does neighbors (but not actives), It also does no
// additional marking
DenDvDxNeighborSmParams pDenN(TYPE_GAS, activeRung, param.csm, dTime,
param.bConstantDiffusion,
param.dConstAlphaMax);
startTime = CkWallTimer();
treeProxy.startSmooth(&pDenN, 1, param.nSmooth, dfBall2OverSoft2,
CkCallbackResumeThread());
ckout << " took " << (CkWallTimer() - startTime) << " seconds."
<< endl;
}
else {
ckout << "Calculating densities/divv ...";
// The following smooths all GAS, and also marks neighbors of
// actives, and those who have actives as neighbors.
DenDvDxSmoothParams pDen(TYPE_GAS, activeRung, param.csm, dTime, 0,
param.bConstantDiffusion, 0, 0,
param.dConstAlphaMax);
double startTime = CkWallTimer();
treeProxy.startSmooth(&pDen, 1, param.nSmooth, dfBall2OverSoft2,
CkCallbackResumeThread());
ckout << " took " << (CkWallTimer() - startTime) << " seconds."
<< endl;
if(verbosity > 1 && !param.bConcurrentSph)
memoryStatsCache();
}
}
treeProxy.sphViscosityLimiter(param.iViscosityLimiter, activeRung,
CkCallbackResumeThread());
double a = csmTime2Exp(param.csm,dTime);
double dDtCourantFac = param.dEtaCourant*a*2.0/1.6;
if(param.bGasCooling)
treeProxy.getCoolingGasPressure(param.dConstGamma,
param.dConstGamma-1,
dDtCourantFac,
param.dResolveJeans/csmTime2Exp(param.csm, dTime),
CkCallbackResumeThread());
else
treeProxy.getAdiabaticGasPressure(param.dConstGamma,
param.dConstGamma-1,
dDtCourantFac,
CkCallbackResumeThread());
ckout << "Calculating pressure gradients ...";
PressureSmoothParams pPressure(TYPE_GAS, activeRung, param.csm, dTime,
param.dConstAlpha, param.dConstBeta,
param.dThermalDiffusionCoeff, param.dMetalDiffusionCoeff,
param.dEtaCourant, param.dEtaDiffusion);
double startTime = CkWallTimer();
treeProxy.startReSmooth(&pPressure, CkCallbackResumeThread());
ckout << " took " << (CkWallTimer() - startTime) << " seconds."
<< endl;
treeProxy.ballMax(activeRung, 1.0+param.ddHonHLimit,
CkCallbackResumeThread());
}
/*
* Initialize energy and ionization state for cooling particles
*/
void TreePiece::InitEnergy(double dTuFac, // T to internal energy
double z, // redshift
double dTime,
const CkCallback& cb)
{
#ifndef COOLING_NONE
COOL *cl;
dm = (DataManager*)CkLocalNodeBranch(dataManagerID);
cl = dm->Cool;
#endif
for(unsigned int i = 1; i <= myNumParticles; ++i) {
GravityParticle *p = &myParticles[i];
if (TYPETest(p, TYPE_GAS) && p->rung >= activeRung) {
#ifndef COOLING_NONE
double T,E;
T = p->u() / dTuFac;
CoolInitEnergyAndParticleData(cl, &p->CoolParticle(), &E,
p->fDensity, T, p->fMetals() );
p->u() = E;
#endif
p->uPred() = p->u();
}
}
// Use shadow array to avoid reduction conflict
smoothProxy[thisIndex].ckLocal()->contribute(cb);
}
/**
* @brief Update the cooling rate (uDot)
*
* @param activeRung (minimum) rung being updated
* @param duDelta array of timesteps of length MAXRUNG+1
* @param dStartTime array of start times of length MAXRUNG+1
* @param bCool Whether cooling is on
* @param bUpdateState Whether the ionization factions need updating
* @param bAll Do all rungs below activeRung
* @param cb Callback.
*/
void TreePiece::updateuDot(int activeRung,
double duDelta[MAXRUNG+1], // timesteps
double dStartTime[MAXRUNG+1],
int bCool, // select equation of state
int bUpdateState, // update ionization fractions
int bAll, // update all rungs below activeRung
const CkCallback& cb)
{
#ifndef COOLING_NONE
double dt; // time in seconds
for(unsigned int i = 1; i <= myNumParticles; ++i) {
GravityParticle *p = &myParticles[i];
if (TYPETest(p, TYPE_GAS)
&& (p->rung == activeRung || (bAll && p->rung >= activeRung))) {
dt = CoolCodeTimeToSeconds(dm->Cool, duDelta[p->rung] );
double ExternalHeating = p->PdV();
ExternalHeating += p->fESNrate();
if ( bCool ) {
COOLPARTICLE cp = p->CoolParticle();
double E = p->u();
double r[3]; // For conversion to C
p->position.array_form(r);
double dtUse = dt;
if(dStartTime[p->rung] + 0.5*duDelta[p->rung]
< p->fTimeCoolIsOffUntil()) {
/* This flags cooling shutoff (e.g., from SNe) to
the cooling functions. */
dtUse = -dt;
p->uDot() = ExternalHeating;
}
CoolIntegrateEnergyCode(dm->Cool, CoolData, &cp, &E,
ExternalHeating, p->fDensity,
p->fMetals(), r, dtUse);
CkAssert(E > 0.0);
if(dtUse > 0 || ExternalHeating*duDelta[p->rung] + p->u() < 0)
// linear interpolation over interval
p->uDot() = (E - p->u())/duDelta[p->rung];
if (bUpdateState) p->CoolParticle() = cp;
}
else {
p->uDot() = ExternalHeating;
}
}
}
#endif
// Use shadow array to avoid reduction conflict
smoothProxy[thisIndex].ckLocal()->contribute(cb);
}
/* Set a maximum ball for inverse Nearest Neighbor searching */
void TreePiece::ballMax(int activeRung, double dhFac, const CkCallback& cb)
{
for(unsigned int i = 1; i <= myNumParticles; ++i) {
if (TYPETest(&myParticles[i], TYPE_GAS)) {
myParticles[i].fBallMax() = myParticles[i].fBall*dhFac;
}
}
// Use shadow array to avoid reduction conflict
smoothProxy[thisIndex].ckLocal()->contribute(cb);
}
int DenDvDxSmoothParams::isSmoothActive(GravityParticle *p)
{
if(bActiveOnly && p->rung < activeRung)
return 0; // not active
return (TYPETest(p, iType));
}
// Non-active neighbors of Actives
int DenDvDxNeighborSmParams::isSmoothActive(GravityParticle *p)
{
if(p->rung < activeRung && TYPETest(p, iType)
&& TYPETest(p, TYPE_NbrOfACTIVE))
return 1;
return 0;
}
// Only do actives
int MarkSmoothParams::isSmoothActive(GravityParticle *p)
{
if(p->rung < activeRung)
return 0; // not active
return (TYPETest(p, iType));
}
/// A remote neighbor particle is active.
void MarkSmoothParams::combSmoothCache(GravityParticle *p1,
ExternalSmoothParticle *p2)
{
p1->iType |= p2->iType;
}
void DenDvDxSmoothParams::initSmoothParticle(GravityParticle *p)
{
TYPEReset(p, TYPE_NbrOfACTIVE);
}
void DenDvDxSmoothParams::initTreeParticle(GravityParticle *p)
{
TYPEReset(p, TYPE_NbrOfACTIVE);
}
void DenDvDxSmoothParams::postTreeParticle(GravityParticle *p)
{
#ifdef CULLENALPHA
if(p->isGas())
p->dvds_old() = p->dvdsOnSFull();
#endif
}
void DenDvDxSmoothParams::initSmoothCache(GravityParticle *p)
{
}
void DenDvDxSmoothParams::combSmoothCache(GravityParticle *p1,
ExternalSmoothParticle *p2)
{
p1->iType |= p2->iType;
}
/* Gather only version */
void DenDvDxSmoothParams::fcnSmooth(GravityParticle *p, int nSmooth,
pqSmoothNode *nnList)
{
double ih2,ih, r2,rs,rs1,fDensity,fNorm,fNorm1,vFac;
double dvxdx, dvxdy, dvxdz, dvydx, dvydy, dvydz, dvzdx, dvzdy, dvzdz;
double dvx,dvy,dvz,dx,dy,dz,trace,grx,gry,grz;
#ifdef CULLENALPHA
double R_CD, R_CDN; ///< R in CD limiter, and
/// normalization for R.
double maxVSignal; ///< Maximum signal velocity
R_CD = 0.0; R_CDN = 0; maxVSignal = 0.0;
#endif
double divvnorm = 0.0;
GravityParticle *q;
int i;
unsigned int qiActive;
ih2 = invH2(p);
ih = sqrt(ih2);
vFac = 1./(a*a); /* converts v to xdot */
fNorm = M_1_PI*ih2*sqrt(ih2);
fDensity = 0.0;
dvxdx = 0; dvxdy = 0; dvxdz= 0;
dvydx = 0; dvydy = 0; dvydz= 0;
dvzdx = 0; dvzdy = 0; dvzdz= 0;
grx = 0; gry = 0; grz= 0;
qiActive = 0;
for (i=0;i<nSmooth;++i) {
double fDist2 = nnList[i].fKey;
r2 = fDist2*ih2;
q = nnList[i].p;
if(q == NULL)
CkAbort("NULL neighbor in DenDvDxSmooth");
if (p->rung >= activeRung)
TYPESet(q,TYPE_NbrOfACTIVE); /* important for SPH */
if(q->rung >= activeRung)
qiActive = 1;
rs = KERNEL(r2, nSmooth);
fDensity += rs*q->mass;
rs1 = DKERNEL(r2);
rs1 *= q->mass;
dx = nnList[i].dx.x; /* NB: dx = px - qx */
dy = nnList[i].dx.y;
dz = nnList[i].dx.z;
dvx = (-p->vPred().x + q->vPred().x)*vFac;
dvy = (-p->vPred().y + q->vPred().y)*vFac;
dvz = (-p->vPred().z + q->vPred().z)*vFac;
dvxdx += dvx*dx*rs1;
dvxdy += dvx*dy*rs1;
dvxdz += dvx*dz*rs1;
dvydx += dvy*dx*rs1;
dvydy += dvy*dy*rs1;
dvydz += dvy*dz*rs1;
dvzdx += dvz*dx*rs1;
dvzdy += dvz*dy*rs1;
dvzdz += dvz*dz*rs1;
divvnorm += (dx*dx+dy*dy+dz*dz)*rs1;
/* Grad P estimate */
/* This used to be:
grx += (-p->uPred + q->uPred)*dx*rs1; But that is
rho grad u*/
grx += (q->uPred())*dx*rs1;
gry += (q->uPred())*dy*rs1;
grz += (q->uPred())*dz*rs1;
#ifdef CULLENALPHA
// Special weighting function to reduce noise in R
// calculation. See discussion after eq. 29 in
// Wadsley et al 2017.
double R_wt = (1-r2*r2*0.0625)* q->mass;
R_CD += q->dvds_old() * R_wt;
R_CDN += R_wt;
// Convention here dvdx = vxq-vxp, dx = xp-xq so
// dvdotdr = -dvx*dx ...
double dvdotdr = -(dvx*dx + dvy*dy + dvz*dz)
+ fDist2*H; // vFac already in there
double cavg = (p->c() + q->c())*0.5;
double vSig = cavg - (dvdotdr < 0 ? dvdotdr/sqrt(fDist2) : 0);
if (vSig > maxVSignal) maxVSignal = vSig;
#endif
}
if (qiActive)
TYPESet(p,TYPE_NbrOfACTIVE);
p->fDensity = fNorm*fDensity;
trace = dvxdx+dvydy+dvzdz;
// keep Norm positive consistent w/ std 1/rho norm
fNorm1 = (divvnorm != 0 ? 3.0/fabs(divvnorm) : 0.0);
#if defined(DIFFUSION) || defined(CULLENALPHA)
double onethirdtrace = (1./3.)*trace;
/* Build Traceless Strain Tensor (not yet normalized) */
double sxx = dvxdx - onethirdtrace; /* pure compression/expansion doesn't diffuse */
double syy = dvydy - onethirdtrace;
double szz = dvzdz - onethirdtrace;
double sxy = 0.5*(dvxdy + dvydx); /* pure rotation doesn't diffuse */
double sxz = 0.5*(dvxdz + dvzdx);
double syz = 0.5*(dvydz + dvzdy);
#endif
#ifdef DIFFUSION
/* diff coeff., nu ~ C L^2 S (add C via dMetalDiffusionConstant, assume L ~ h) */
if (bConstantDiffusion) p->diff() = 1;
else p->diff() = fNorm1*0.25*p->fBall*p->fBall*sqrt(2*(sxx*sxx + syy*syy + szz*szz + 2*(sxy*sxy + sxz*sxz + syz*syz)));
#endif
p->divv() = fNorm1*trace + 3.0*H; /* physical */
p->curlv().x = fNorm1*(dvzdy - dvydz);
p->curlv().y = fNorm1*(dvxdz - dvzdx);
p->curlv().z = fNorm1*(dvydx - dvxdy);
#ifdef CULLENALPHA
double alphaLoc, tau;
double l = 0.1;
double Hcorr = (fNorm1 != 0 ? H/fNorm1 : 0);
double gnorm = (grx*grx+gry*gry+grz*grz);
if (gnorm > 0) gnorm=1/sqrt(gnorm);
grx *= gnorm;
gry *= gnorm;
grz *= gnorm;
double dvdr = (((dvxdx+Hcorr)*grx+dvxdy*gry+dvxdz*grz)*grx
+ (dvydx*grx+(dvydy+Hcorr)*gry+dvydz*grz)*gry
+ (dvzdx*grx+dvzdy*gry+(dvzdz+Hcorr)*grz)*grz)*fNorm1;
double pdvds_old = p->dvds();
double dvds = (p->divv() < 0 ? 1.5*(dvdr -(1./3.)*p->divv()) : dvdr );
double sxxf = dvxdx+Hcorr, syyf = dvydy+Hcorr, szzf = dvzdz+Hcorr;
double SFull = sqrt(fNorm1*fNorm1*(sxxf*sxxf+syyf*syyf+szzf*szzf
+ 2*(sxy*sxy + sxz*sxz + syz*syz)));
p->dvdsOnSFull() = SFull > 0 ? dvds/SFull : 0;
#ifdef CD_SFULL
p->dvds() = p->dvdsOnSFull();
#else
p->dvds() = dvds;
#endif
// time interval = current time - last time divv was calculated
double deltaT = dTime - p->TimeDivV();
double divVDot = (p->dvds() - pdvds_old)/deltaT;
p->TimeDivV() = dTime;
// If we are initializing the simulation, the current time step is zero and we can't compute the time
// derivative of the velocity divergence in the Cullen & Dehnen formulation
if (bStarting && !bHaveAlpha){
// If the divergence of the velocity of the particle is negative and the speed of sound is nonzero
// we set p->CullenAlpha() using the M&M prescription. Otherwise p->CullenAlpha() is zero
if ((p->divv() < 0) && (p->c() > 0)){
tau = p->fBall / (2.0*l*maxVSignal);
alphaLoc = -dAlphaMax*p->divv()*tau / (1.0 - p->divv()*tau);
}
else alphaLoc = 0.0;
p->CullenAlpha() = alphaLoc;
}
// If the current time step > 0
else if(!bHaveAlpha) {
if (p->dvds() < 0 && divVDot < 0){ // Flow is converging and
// convergence is increasing
double OneMinusR_CD = (R_CDN > 0 ? 1-(R_CD/R_CDN) : 0);
double xi = (OneMinusR_CD < -1 ? 0 :
(OneMinusR_CD > 2 ? 1 : 0.0625*OneMinusR_CD*OneMinusR_CD*OneMinusR_CD*OneMinusR_CD));
// Multiplier for ATerm in CD viscosity.
const double dAFac = 2.0;
double Aterm = xi * p->fBall * p->fBall * fabs(divVDot)*dAFac;
// The local alpha value
alphaLoc = dAlphaMax* Aterm / (maxVSignal*maxVSignal + Aterm);
}
else alphaLoc = 0;
// Decay parameter
tau = 1. / (l*maxVSignal*ih);
// If alphaLoc is larger then the current p->CullenAlpha(), we set p->CullenAlhpa() to be equal to alphaLoc.
// Otherwise, we decay p->CullenAlpha() to the alphaLoc value
if (alphaLoc > p->CullenAlpha()) p->CullenAlpha() = alphaLoc;
else{
double oldCullenAlpha = p->CullenAlpha();
p->CullenAlpha() = alphaLoc - (alphaLoc - oldCullenAlpha)*exp(-deltaT/tau);
}
}
#endif /* CULLENALPHA */
}
void DenDvDxNeighborSmParams::postTreeParticle(GravityParticle *p)
{
#ifdef CULLENALPHA
if(p->isGas())
p->dvds_old() = p->dvdsOnSFull();
#endif
}
void
TreePiece::sphViscosityLimiter(int bOn, int activeRung, const CkCallback& cb)
{
int i;
GravityParticle *p;
// Pressure will be called next, so check this here.
CkAssert(bBucketsInited);
if (bOn) {
for(i=1; i<= myNumParticles; ++i) {
p = &myParticles[i];
/* Only set values for particles with fresh curlv, divv
from smooth */
if(TYPETest(p, TYPE_GAS) && p->rung >= activeRung) {
if (p->divv() != 0.0) {
p->BalsaraSwitch() = fabs(p->divv())/
(fabs(p->divv()) + sqrt(p->curlv().lengthSquared()));
}
else {
p->BalsaraSwitch() = 0.0;
}
}
}
}
else {
for(i=1; i<= myNumParticles; ++i) {
p = &myParticles[i];
if(TYPETest(p, TYPE_GAS)) {
p->BalsaraSwitch() = 1.0;
}
}
}
// Use shadow array to avoid reduction conflict
smoothProxy[thisIndex].ckLocal()->contribute(cb);
}
/* Note: Uses uPred */
void TreePiece::getAdiabaticGasPressure(double gamma, double gammam1,
double dtFacCourant,
const CkCallback &cb)
{
GravityParticle *p;
double PoverRho;
int i;
for(i=1; i<= myNumParticles; ++i) {
p = &myParticles[i];
if (TYPETest(p, TYPE_GAS)) {
PoverRho = gammam1*p->uPred();
p->PoverRho2() = PoverRho/p->fDensity;
p->c() = sqrt(gamma*PoverRho);
#ifdef DTADJUST
{
double uDot = p->PdV();
double dt;
if(uDot > 0.0)
dt = dtFacCourant*0.5*p->fBall
/sqrt(4.0*(p->c()*p->c() + GAMMA_NONCOOL*uDot*p->dt));
else
dt = dtFacCourant*0.5*p->fBall /(2.0*p->c());
// Update to scare the neighbors.
if(dt < p->dtNew()) p->dtNew() = dt;
}
#endif
}
}
// Use shadow array to avoid reduction conflict
smoothProxy[thisIndex].ckLocal()->contribute(cb);
}
/* Note: Uses uPred */
void TreePiece::getCoolingGasPressure(double gamma, double gammam1,
double dtFacCourant,
double dResolveJeans,
const CkCallback &cb)
{
#ifndef COOLING_NONE
GravityParticle *p;
double PoverRho;
int i;
COOL *cl = dm->Cool;
for(i=1; i<= myNumParticles; ++i) {
p = &myParticles[i];
if (TYPETest(p, TYPE_GAS)) {
double cGas;
CoolCodePressureOnDensitySoundSpeed(cl, &p->CoolParticle(),
p->uPred(), p->fDensity(),
gamma, gammam1, &PoverRho,
&cGas);
double dPoverRhoJeans = PoverRhoFloorJeans(dResolveJeans, p);
if(PoverRho < dPoverRhoJeans) PoverRho = dPoverRhoJeans;
p->PoverRho2() = PoverRho/p->fDensity;
p->c() = sqrt(cGas*cGas + GAMMA_JEANS*dPoverRhoJeans);
#ifdef DTADJUST
{
double uDot = p->uDot();
double dt;
if(uDot > 0.0)
dt = dtFacCourant*0.5*p->fBall
/sqrt(4.0*(p->c()*p->c() + GAMMA_NONCOOL*uDot*p->dt));
else
dt = dtFacCourant*0.5*p->fBall /(2.0*p->c());
// Update to scare the neighbors.
if(dt < p->dtNew()) p->dtNew() = dt;
}
#endif
}
}
#endif
// Use shadow array to avoid reduction conflict
smoothProxy[thisIndex].ckLocal()->contribute(cb);
}
int PressureSmoothParams::isSmoothActive(GravityParticle *p)
{
return (TYPETest(p, TYPE_NbrOfACTIVE));
}
/* Original Particle */
void PressureSmoothParams::initSmoothParticle(GravityParticle *p)
{
if (p->rung >= activeRung) {
p->mumax() = 0.0;
#ifdef DTADJUST
p->dtNew() = FLT_MAX;
#endif
p->PdV() = 0.0;
#ifdef DIFFUSION
p->fMetalsDot() = 0.0;
p->fMFracOxygenDot() = 0.0;
p->fMFracIronDot() = 0.0;
#endif /* DIFFUSION */
}
}
/* Cached copies of particle */
void PressureSmoothParams::initSmoothCache(GravityParticle *p)
{
if (p->rung >= activeRung) {
p->mumax() = 0.0;
#ifdef DTADJUST
p->dtNew() = FLT_MAX;
#endif
p->PdV() = 0.0;
p->treeAcceleration = 0.0;
#ifdef DIFFUSION
p->fMetalsDot() = 0.0;
p->fMFracOxygenDot() = 0.0;
p->fMFracIronDot() = 0.0;
#endif /* DIFFUSION */
}
}
void PressureSmoothParams::combSmoothCache(GravityParticle *p1,
ExternalSmoothParticle *p2)
{
if (p1->rung >= activeRung) {
p1->PdV() += p2->PdV;
if (p2->mumax > p1->mumax())
p1->mumax() = p2->mumax;
p1->treeAcceleration += p2->treeAcceleration;
#ifdef DIFFUSION
p1->fMetalsDot() += p2->fMetalsDot;
p1->fMFracOxygenDot() += p2->fMFracOxygenDot;
p1->fMFracIronDot() += p2->fMFracIronDot;
#endif /* DIFFUSION */
}
#ifdef DTADJUST
// All neighbors get their rungs adjusted.
if (p2->dtNew < p1->dtNew())
p1->dtNew() = p2->dtNew;
#endif
}
void PressureSmoothParams::fcnSmooth(GravityParticle *p, int nSmooth,
pqSmoothNode *nnList)
{
GravityParticle *q;
PressSmoothUpdate params;
PressSmoothParticle pParams;
PressSmoothParticle qParams;
double ih2,r2,rs1;
Vector3D<double> dv;
double ph,absmu;
double fNorm1,vFac;
double fDivv_Corrector;
double dt;
int i;
if(nSmooth < 2) {
CkError("WARNING: lonely SPH particle\n");
return;
}
#ifndef RTFORCE
pParams.PoverRho2 = p->PoverRho2();
pParams.PoverRho2f = pParams.PoverRho2;
#endif
ph = 0.5 * p->fBall;
ih2 = invH2(p);
fNorm1 = 0.5*M_1_PI*ih2*ih2/ph; /* converts to physical u */
params.aFac = a; /* comoving acceleration factor */
vFac = 1./(a*a); /* converts v to xdot */
#ifdef RTFORCE
double divvi = 0;
double divvj = 0;
for (i=0;i<nSmooth;++i) {
double fDist2 = nnList[i].fKey;
r2 = fDist2*ih2;
q = nnList[i].p;
rs1 = DKERNEL(r2);
rs1 *= fDist2*q->mass;
divvi += rs1;
divvj += rs1/q->fDensity;
}
divvi /= p->fDensity;
fDivv_Corrector = (divvj != 0.0 ? divvi/divvj : 1.0);
#else
fDivv_Corrector = 1.0;
#endif
for (i=0;i<nSmooth;++i) {
q = nnList[i].p;
if ((p->rung < activeRung) && (q->rung < activeRung)) continue;
double fDist2 = nnList[i].fKey;
r2 = fDist2*ih2;
rs1 = DKERNEL(r2);
rs1 *= fNorm1;
rs1 *= fDivv_Corrector;
pParams.rNorm = rs1 * p->mass;
qParams.rNorm = rs1 * q->mass;
params.dx = nnList[i].dx;
dv = p->vPred() - q->vPred();
params.dvdotdr = vFac*dot(dv, params.dx) + fDist2*H;
#ifdef RTFORCE
pParams.PoverRho2 = p->PoverRho2()*p->fDensity/q->fDensity;
pParams.PoverRho2f = pParams.PoverRho2;
qParams.PoverRho2 = q->PoverRho2()*q->fDensity/p->fDensity;
qParams.PoverRho2f = qParams.PoverRho2;
#else
qParams.PoverRho2 = q->PoverRho2();
qParams.PoverRho2f = qParams.PoverRho2;
#endif
/***********************************
* SPH Pressure Terms Calculation
***********************************/
/* Calculate Artificial viscosity term prefactor terms
*
* Updates:
* dt
* params.visc
*/
{ // Begin SPH pressure terms calculation and scope the variables below
if (params.dvdotdr>=0.0) {
dt = dtFacCourant*ph/(2*(p->c() > q->c() ? p->c() : q->c()));
params.visc = 0.0;
} else {
#ifdef VSIGVISC /* compile-time flag */
/* mu multiply by a to be consistent with physical c */
absmu = -params.dvdotdr*a/sqrt(fDist2);
/* mu terms for gas time step */
if (absmu>p->mumax()) p->mumax()=absmu;
if (absmu>q->mumax()) q->mumax()=absmu;
/* viscosity terms */
params.visc = (varAlpha(alpha, p, q)*(p->c() + q->c())
+ varBeta(beta, p, q)*1.5*absmu);
dt = dtFacCourant*ph/(0.625*(p->c() + q->c())+0.375*params.visc);
params.visc = switchCombine(p,q)*params.visc*absmu/(p->fDensity + q->fDensity);
#else
/* h mean */
double hav=0.5*(ph+0.5*q->fBall);
/* mu multiply by a to be consistent with physical c */
absmu = -hav*params.dvdotdr*a/(fDist2+0.01*hav*hav);
/* mu terms for gas time step */
if (absmu>p->mumax()) p->mumax()=absmu;
if (absmu>q->mumax()) q->mumax()=absmu;
/* viscosity terms */
params.visc = (varAlpha(alpha, p, q)*(p->c() + q->c()) \
+ varBeta(beta, p, q)*2*absmu);
dt = dtFacCourant*hav/(0.625*(p->c() + q->c())+0.375*params.visc);
params.visc = switchCombine(p,q)*params.visc*absmu/(p->fDensity + q->fDensity);
#endif //VSIGVISC
}
/* Calculate diffusion terms */
#ifdef DIFFUSION /* compile-time flag */
// Diffusion Base term
#ifdef DIFFUSIONHARMONIC /* compile-time flag */
double diffSum = (p->diff()+q->diff());
double diffBase = (diffusionLimitTest(diffSum, dTime, p, q) ? 0
: 4*p->diff()*q->diff()/diffSum);
#else
double diffSum = (p->diff()+q->diff());
double diffBase = (diffusionLimitTest(diffSum, dTime, p, q)
? 0 : diffSum);
#endif
// Metals Base term
/* massdiff not implemented */
// #ifdef MASSDIFF /* compile-time flag */
// double diffMetalsBase = 4*smf->dMetalDiffusionCoeff*diffBase \
// /((p->fDensity+q->fDensity)*(p->fMass+q->fMass));
// #else
double diffMetalsBase = 2*dMetalDiffusionCoeff*diffBase \
/(p->fDensity+q->fDensity);
// #endif //MASSDIFF
// Thermal diffusion
/*
* Updates:
* dt
* params.diffu
* diffTh
* params.diffuNc
*/
double diffTh;
// /* DIFFUSIONPRICE not implemented */
// #ifdef DIFFUSIONPRICE /* compile-time flag */
// {
// double irhobar = 2/(p->fDensity+q->fDensity);
// double vsig = sqrt(fabs(qParams.PoverRho2*q->fDensity*q->fDensity \
// - pParams.PoverRho2*p->fDensity*p->fDensity)\
// *irhobar);
// diffTh = smf->dThermalDiffusionCoeff*0.5 \
// * (ph+sqrt(0.25*BALL2(q)))*irhobar*vsig;
// params.diffu = diffTh*(p->uPred-q->uPred);
// }
// #else
#ifndef NODIFFUSIONTHERMAL /* compile-time flag */
{
diffTh = (2*dThermalDiffusionCoeff*diffBase/(p->fDensity+q->fDensity));
double dt_diff;
double dThermalCond;
// /* THERMALCOND not implemented */
// #ifdef THERMALCOND /* compile-time flag */
// #if (0)
// /* Harmonic average coeff */
// double dThermalCondSum = p->fThermalCond + q->fThermalCond;
// dThermalCond = ( dThermalCondSum <= 0 ? 0 \
// : 4*p->fThermalCond*q->fThermalCond \
// /(dThermalCondSum*p->fDensity*q->fDensity) );
// #else
// /* Arithmetic average coeff */
// dThermalCond = (p->fThermalCond + q->fThermalCond) \
// /(p->fDensity*q->fDensity);
// if (dThermalCond > 0 && (dt_diff = dtFacDiffusion*ph \
// *p->fThermalLength/(dThermalCond*p->fDensity)) < dt){
// dt = dt_diff;
// }
// #endif
// #else
dThermalCond = 0.0;
// #endif //THERMALCOND
if (diffTh > 0 && (dt_diff= dtFacDiffusion*ph*ph/(diffTh*p->fDensity)) < dt) dt = dt_diff;
params.diffu = (diffTh+dThermalCond)*(p->uPred()-q->uPred());
}
#endif
// #endif //DIFFUSIONPRICE
// /* not implemented */
// #ifdef UNONCOOL /* compile-time flag */
// params.diffuNc = diffTh*(p->uNoncoolPred-q->uNoncoolPred);
// #endif
// Calculate diffusion pre-factor terms (required for updating particles)
params.diffMetals = diffMetalsBase*(p->fMetals() - q->fMetals());
params.diffMetalsOxygen = diffMetalsBase*(p->fMFracOxygen() - q->fMFracOxygen());
params.diffMetalsIron = diffMetalsBase*(p->fMFracIron() - q->fMFracIron());
// /* not implemented */
// #ifdef MASSDIFF /* compile-time flag */
// params.diffMass = diffMetalsBase*(p->fMass - q->fMass);
// // To properly implement this in ChaNGa the correct velocity
// // should be chosen
// params.diffVelocity = diffMetalsBase * (p->velocity - q->velocity);
// #endif
#endif
if (p->rung >= activeRung) {
updateParticle(p, q, ¶ms, &pParams, &qParams, 1);
}
if (q->rung >= activeRung) {
updateParticle(q, p, ¶ms, &qParams, &pParams, -1);
}
// Adust dt
#ifdef DTADJUST /* compile-time flag */
if (dt < p->dtNew()) p->dtNew() = dt;
if (dt < q->dtNew()) q->dtNew() = dt;
if (4*q->dt < p->dtNew()) p->dtNew() = 4*q->dt;
if (4*p->dt < q->dtNew()) q->dtNew() = 4*p->dt;
#endif
} // End SPH Pressure Terms calculations
}
}
/**
* @brief updateParticle is used to update particle attributes during the
* SPH pressure terms calculations.
*
* The updating of particle p and the neighbor q during this loop is symmetric
* (up to a possible sign change). For example, to update p and its neighbor
* q is two lines:
* updateParticle(p, q, params, pParams, qParams, 1);
* updateParticle(q, p, params, qParams, pParams, -1);
* @param a particle to update
* @param b interacting neighbor particle
* @param params prefactor params
* @param aParams params specific to a
* @param bParams params specific to b
* @param sign 1 for a = p (the self particle) and -1 for a = q (the neighbor)
*/
void updateParticle(GravityParticle *a, GravityParticle *b,
PressSmoothUpdate *params, PressSmoothParticle *aParams,
PressSmoothParticle *bParams, int sign) {
double acc;
// Update diffusion terms
#ifdef DIFFUSION /* compile-time flag */
// Thermal diffusion
// /* not implemented */
// #ifdef DIFFUSIONPRICE /* compile-time flag */
// a->uDotDiff += sign * params->diffu * bParams->rNorm;
// #else
#ifndef NODIFFUSIONTHERMAL /* compile-time flag */
a->PdV() += sign * params->diffu * bParams->rNorm \
* massDiffFac(b);
#endif
// #endif //DIFFUSIONPRICE
// /* not implemented */
// #ifdef UNONCOOL /* compile-time flag */
// a->uNoncoolDotDiff += sign * params->diffuNc * bParams->rNorm;
// #endif
// Metals diffusion
a->fMetalsDot() += sign * params->diffMetals * bParams->rNorm
* massDiffFac(b);
a->fMFracOxygenDot() += sign * params->diffMetalsOxygen
* bParams->rNorm * massDiffFac(b);
a->fMFracIronDot() += sign * params->diffMetalsIron * bParams->rNorm
* massDiffFac(b);
// /* not implemented */
// #ifdef MASSDIFF /* compile-time flag */
// // Note: to implement this in ChaNGa, ACCEL should be properly vectorized
// a->fMassDot += sign * params->diffMass * a->fMass * bParams->rNorm;
// ACCEL(a) += sign * params->diffVelocity * bParams->rNorm \
// * massDiffFac(b);
// #endif
#endif
// Update pressure/viscosity terms
// /* not implemented */
// #ifdef DRHODT /* compile-time flag */
// a->fDivv_PdV -= bParams->rNorm / params->fDivv_Corrector / \
// rhoDivv(a->fDensity,b->fDensity) * params->dvdotdr;
// a->fDivv_PdVcorr -= bParams->rNorm / rhoDivv(a->fDensity,b->fDensity) \
// * params->dvdotdr;
// #endif
a->PdV() += bParams->rNorm*presPdv(aParams->PoverRho2, bParams->PoverRho2)
* params->dvdotdr;
a->PdV() += bParams->rNorm * 0.5 * params->visc * params->dvdotdr;
acc = presAcc(aParams->PoverRho2f, bParams->PoverRho2f) \
+ params->visc;
acc *= bParams->rNorm * params->aFac;
a->treeAcceleration -= sign * acc * params->dx;
}
/*
* Methods to distribute Deleted gas
*/
int DistDeletedGasSmoothParams::isSmoothActive(GravityParticle *p)
{
return (TYPETest(p, TYPE_DELETED) && TYPETest(p, iType));
}
void DistDeletedGasSmoothParams::initSmoothCache(GravityParticle *p)
{
if(!TYPETest(p, TYPE_DELETED)) {
/*
* Zero out accumulated quantities.
*/
p->mass = 0;
p->velocity[0] = 0;
p->velocity[1] = 0;
p->velocity[2] = 0;
#ifndef COOLING_NONE
p->u() = 0;
p->uDot() = 0.0;
#endif
p->fMetals() = 0.0;
p->fMFracIron() = 0.0;
p->fMFracOxygen() = 0.0;
}
}
void DistDeletedGasSmoothParams::combSmoothCache(GravityParticle *p1,
ExternalSmoothParticle *p2)
{
/*
* Distribute u, v, and fMetals for particles returning from cache
* so that everything is conserved nicely.
*/
if(!TYPETest((p1), TYPE_DELETED)) {
double delta_m = p2->mass;
double m_new,f1,f2;
double fTCool; /* time to cool to zero */
m_new = p1->mass + delta_m;
if (m_new > 0) {
f1 = p1->mass /m_new;
f2 = delta_m /m_new;
p1->mass = m_new;
p1->velocity = f1*p1->velocity + f2*p2->velocity;
p1->fMetals() = f1*p1->fMetals() + f2*p2->fMetals;
p1->fMFracIron() = f1*p1->fMFracIron() + f2*p2->fMFracIron;
p1->fMFracOxygen() = f1*p1->fMFracOxygen() + f2*p2->fMFracOxygen;
#ifndef COOLING_NONE
if(p1->uDot() < 0.0) /* margin of 1% to avoid roundoff
* problems */
fTCool = 1.01*p1->uPred()/p1->uDot();
p1->u() = f1*p1->u() + f2*p2->u;
p1->uPred() = f1*p1->uPred() + f2*p2->uPred;
if(p1->uDot() < 0.0)
p1->uDot() = p1->uPred()/fTCool;
#endif
}
}
}
void DistDeletedGasSmoothParams::fcnSmooth(GravityParticle *p, int nSmooth,
pqSmoothNode *nnList)
{
GravityParticle *q;
double fNorm,ih2,r2,rs,rstot,delta_m,m_new,f1,f2;
double fTCool; /* time to cool to zero */
int i;
CkAssert(TYPETest(p, TYPE_GAS));
ih2 = invH2(p);
rstot = 0;
for (i=0;i<nSmooth;++i) {
double fDist2 = nnList[i].fKey;
q = nnList[i].p;
if(TYPETest(q, TYPE_DELETED)) continue;
CkAssert(TYPETest(q, TYPE_GAS));
r2 = fDist2*ih2;
rs = KERNEL(r2, nSmooth);
rstot += rs;
}
if(rstot <= 0.0) {
if(p->mass == 0.0) /* the particle to be deleted has NOTHING */
return;
/* we have a particle to delete and nowhere to put its mass
* => we will keep it around */
unDeleteParticle(p);
return;
}
CkAssert(rstot > 0.0);
fNorm = 1./rstot;
CkAssert(p->mass >= 0.0);
for (i=0;i<nSmooth;++i) {
q = nnList[i].p;
if(TYPETest(q, TYPE_DELETED)) continue;
double fDist2 = nnList[i].fKey;
r2 = fDist2*ih2;
rs = KERNEL(r2, nSmooth);
/*
* All these quantities are per unit mass.
* Exact if only one gas particle being distributed or in serial
* Approximate in parallel (small error).
*/
delta_m = rs*fNorm*p->mass;
m_new = q->mass + delta_m;
/* Cached copies can have zero mass: skip them */
if (m_new == 0) continue;
f1 = q->mass /m_new;
f2 = delta_m /m_new;
q->mass = m_new;
q->velocity = f1*q->velocity + f2*p->velocity;
q->fMetals() = f1*q->fMetals() + f2*p->fMetals();
q->fMFracIron() = f1*q->fMFracIron() + f2*p->fMFracIron();
q->fMFracOxygen() = f1*q->fMFracOxygen() + f2*p->fMFracOxygen();
#ifndef COOLING_NONE
if(q->uDot() < 0.0) /* margin of 1% to avoid roundoff error */
fTCool = 1.01*q->uPred()/q->uDot();
q->u() = f1*q->u()+f2*p->u();
q->uPred() = f1*q->uPred()+f2*p->uPred();
if(q->uDot() < 0.0) /* make sure we don't shorten cooling time */
q->uDot() = q->uPred()/fTCool;
#endif
}
}